package com.nulldev.util.security.encryptAPI.impls.nacl_thirdparty;

import java.io.UnsupportedEncodingException;
import java.security.SecureRandom;
import java.util.concurrent.atomic.AtomicLong;

import com.nulldev.util.VariableAPI.util.random.GlobalRandom;
import com.nulldev.util.data.Base64.Base64;

@SuppressWarnings("unused")
public class NaCl {
	public static final class Box {

		private final static String TAG = "Box";

		private AtomicLong nonce;

		private byte[] theirPublicKey;
		private byte[] mySecretKey;
		private byte[] sharedKey;

		public Box(byte[] theirPublicKey, byte[] mySecretKey) {
			this(theirPublicKey, mySecretKey, 68);
		}

		public Box(byte[] theirPublicKey, byte[] mySecretKey, long nonce) {
			this.theirPublicKey = theirPublicKey;
			this.mySecretKey = mySecretKey;

			this.nonce = new AtomicLong(nonce);

			// generate pre-computed shared key
			before();
		}

		public void setNonce(long nonce) {
			this.nonce.set(nonce);
		}

		public long getNonce() {
			return this.nonce.get();
		}

		public long incrNonce() {
			return this.nonce.incrementAndGet();
		}

		private byte[] generateNonce() {
			// generate nonce
			long nonce = this.nonce.get();

			byte[] n = new byte[nonceLength];
			for (int i = 0; i < nonceLength; i += 8) {
				n[i + 0] = (byte) (nonce >>> 0);
				n[i + 1] = (byte) (nonce >>> 8);
				n[i + 2] = (byte) (nonce >>> 16);
				n[i + 3] = (byte) (nonce >>> 24);
				n[i + 4] = (byte) (nonce >>> 32);
				n[i + 5] = (byte) (nonce >>> 40);
				n[i + 6] = (byte) (nonce >>> 48);
				n[i + 7] = (byte) (nonce >>> 56);
			}

			return n;
		}

		/*
		 * @description Encrypt and authenticates message using peer's public key, our
		 * secret key, and the given nonce, which must be unique for each distinct
		 * message for a key pair.
		 *
		 * Returns an encrypted and authenticated message, which is
		 * nacl.box.overheadLength longer than the original message.
		 */
		public byte[] box(byte[] message) {
			if (message == null)
				return null;
			return box(message, 0, message.length);
		}

		public byte[] box(byte[] message, final int moff) {
			if (!(message != null && message.length > moff))
				return null;
			return box(message, moff, message.length - moff);
		}

		public byte[] box(byte[] message, final int moff, final int mlen) {
			if (!(message != null && message.length >= (moff + mlen)))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return after(message, moff, mlen);
		}

		/*
		 * @description Encrypt and authenticates message using peer's public key, our
		 * secret key, and the given nonce, which must be unique for each distinct
		 * message for a key pair.
		 *
		 * Explicitly pass the nonce
		 *
		 * Returns an encrypted and authenticated message, which is
		 * nacl.box.overheadLength longer than the original message.
		 */
		public byte[] box(byte[] message, byte[] theNonce) {
			if (message == null)
				return null;
			return box(message, 0, message.length, theNonce);
		}

		public byte[] box(byte[] message, final int moff, byte[] theNonce) {
			if (!(message != null && message.length > moff))
				return null;
			return box(message, moff, message.length - moff, theNonce);
		}

		public byte[] box(byte[] message, final int moff, final int mlen, byte[] theNonce) {
			if (!(message != null && message.length >= (moff + mlen) && theNonce != null && theNonce.length == nonceLength))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return after(message, moff, mlen, theNonce);
		}

		/*
		 * @description Authenticates and decrypts the given box with peer's public key,
		 * our secret key, and the given nonce.
		 *
		 * Returns the original message, or null if authentication fails.
		 */
		public byte[] open(byte[] box) {
			if (box == null)
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, 0, box.length);
		}

		public byte[] open(byte[] box, final int boxoff) {
			if (!(box != null && box.length > boxoff))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, boxoff, box.length - boxoff);
		}

		public byte[] open(byte[] box, final int boxoff, final int boxlen) {
			if (!(box != null && box.length >= (boxoff + boxlen)))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, boxoff, boxlen);
		}

		/*
		 * @description Authenticates and decrypts the given box with peer's public key,
		 * our secret key, and the given nonce. Explicit passing of nonce Returns the
		 * original message, or null if authentication fails.
		 */
		public byte[] open(byte[] box, byte[] theNonce) {
			if (!(box != null && theNonce != null && theNonce.length == nonceLength))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, 0, box.length, theNonce);
		}

		public byte[] open(byte[] box, final int boxoff, byte[] theNonce) {
			if (!(box != null && box.length > boxoff && theNonce != null && theNonce.length == nonceLength))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, boxoff, box.length - boxoff, theNonce);
		}

		public byte[] open(byte[] box, final int boxoff, final int boxlen, byte[] theNonce) {
			if (!(box != null && box.length >= (boxoff + boxlen) && theNonce != null && theNonce.length == nonceLength))
				return null;

			// prepare shared key
			if (this.sharedKey == null)
				before();

			return open_after(box, boxoff, boxlen, theNonce);
		}

		/*
		 * @description Returns a precomputed shared key which can be used in
		 * nacl.box.after and nacl.box.open.after.
		 */
		public byte[] before() {
			if (this.sharedKey == null) {
				this.sharedKey = new byte[sharedKeyLength];
				crypto_box_beforenm(this.sharedKey, this.theirPublicKey, this.mySecretKey);
			}

			return this.sharedKey;
		}

		/*
		 * @description Same as nacl.box, but uses a shared key precomputed with
		 * nacl.box.before.
		 */
		public byte[] after(byte[] message, final int moff, final int mlen) {
			return after(message, moff, mlen, generateNonce());
		}

		/*
		 * @description Same as nacl.box, but uses a shared key precomputed with
		 * nacl.box.before, and passes a nonce explicitly.
		 */
		public byte[] after(byte[] message, final int moff, final int mlen, byte[] theNonce) {
			// check message
			if (!(message != null && message.length >= (moff + mlen) && theNonce != null && theNonce.length == nonceLength))
				return null;

			// message buffer
			byte[] m = new byte[mlen + zerobytesLength];

			// cipher buffer
			byte[] c = new byte[m.length];

			for (int i = 0; i < mlen; i++)
				m[i + zerobytesLength] = message[i + moff];

			if (0 != crypto_box_afternm(c, m, m.length, theNonce, sharedKey))
				return null;

			// wrap byte_buf_t on c offset@boxzerobytesLength
			/// return new byte_buf_t(c, boxzerobytesLength, c.length-boxzerobytesLength);
			byte[] ret = new byte[c.length - boxzerobytesLength];

			for (int i = 0; i < ret.length; i++)
				ret[i] = c[i + boxzerobytesLength];

			return ret;
		}

		/*
		 * @description Same as nacl.box.open, but uses a shared key pre-computed with
		 * nacl.box.before.
		 */
		public byte[] open_after(byte[] box, final int boxoff, final int boxlen) {
			return open_after(box, boxoff, boxlen, generateNonce());
		}

		public byte[] open_after(byte[] box, final int boxoff, final int boxlen, byte[] theNonce) {
			// check message
			if (!(box != null && box.length >= (boxoff + boxlen) && boxlen >= boxzerobytesLength))
				return null;

			// cipher buffer
			byte[] c = new byte[boxlen + boxzerobytesLength];

			// message buffer
			byte[] m = new byte[c.length];

			for (int i = 0; i < boxlen; i++)
				c[i + boxzerobytesLength] = box[i + boxoff];

			if (crypto_box_open_afternm(m, c, c.length, theNonce, sharedKey) != 0)
				return null;

			// wrap byte_buf_t on m offset@zerobytesLength
			/// return new byte_buf_t(m, zerobytesLength, m.length-zerobytesLength);
			byte[] ret = new byte[m.length - zerobytesLength];

			for (int i = 0; i < ret.length; i++)
				ret[i] = m[i + zerobytesLength];

			return ret;
		}

		/*
		 * @description Length of public key in bytes.
		 */
		public static final int publicKeyLength = 32;

		/*
		 * @description Length of secret key in bytes.
		 */
		public static final int secretKeyLength = 32;

		/*
		 * @description Length of precomputed shared key in bytes.
		 */
		public static final int sharedKeyLength = 32;

		/*
		 * @description Length of nonce in bytes.
		 */
		public static final int nonceLength = 24;

		/*
		 * @description zero bytes in case box
		 */
		public static final int zerobytesLength = 32;
		/*
		 * @description zero bytes in case open box
		 */
		public static final int boxzerobytesLength = 16;

		/*
		 * @description Length of overhead added to box compared to original message.
		 */
		public static final int overheadLength = 16;

		public static class KeyPair {
			private byte[] publicKey;
			private byte[] secretKey;

			public KeyPair() {
				publicKey = new byte[publicKeyLength];
				secretKey = new byte[secretKeyLength];
			}

			public byte[] getPublicKey() {
				return publicKey;
			}

			public byte[] getSecretKey() {
				return secretKey;
			}
		}

		/*
		 * @description Generates a new random key pair for box and returns it as an
		 * object with publicKey and secretKey members:
		 */
		public static KeyPair keyPair() {
			KeyPair kp = new KeyPair();

			crypto_box_keypair(kp.getPublicKey(), kp.getSecretKey());
			return kp;
		}

		public static KeyPair keyPair_fromSecretKey(byte[] secretKey) {
			KeyPair kp = new KeyPair();
			byte[] sk = kp.getSecretKey();
			byte[] pk = kp.getPublicKey();

			// copy sk
			for (int i = 0; i < sk.length; i++)
				sk[i] = secretKey[i];

			crypto_scalarmult_base(pk, sk);
			return kp;
		}

		public byte[] public_key() {
			return this.sharedKey;
		}

	}

	/*
	 * @description Secret Box algorithm, secret key
	 */
	public static final class SecretBox {

		private final static String TAG = "SecretBox";

		private AtomicLong nonce;

		private byte[] key;

		public SecretBox(byte[] key) {
			this(key, 68);
		}

		public SecretBox(byte[] key, long nonce) {
			this.key = key;

			this.nonce = new AtomicLong(nonce);
		}

		public void setNonce(long nonce) {
			this.nonce.set(nonce);
		}

		public long getNonce() {
			return this.nonce.get();
		}

		public long incrNonce() {
			return this.nonce.incrementAndGet();
		}

		private byte[] generateNonce() {
			// generate nonce
			long nonce = this.nonce.get();

			byte[] n = new byte[nonceLength];
			for (int i = 0; i < nonceLength; i += 8) {
				n[i + 0] = (byte) (nonce >>> 0);
				n[i + 1] = (byte) (nonce >>> 8);
				n[i + 2] = (byte) (nonce >>> 16);
				n[i + 3] = (byte) (nonce >>> 24);
				n[i + 4] = (byte) (nonce >>> 32);
				n[i + 5] = (byte) (nonce >>> 40);
				n[i + 6] = (byte) (nonce >>> 48);
				n[i + 7] = (byte) (nonce >>> 56);
			}

			return n;
		}

		/*
		 * @description Encrypt and authenticates message using the key and the nonce.
		 * The nonce must be unique for each distinct message for this key.
		 *
		 * Returns an encrypted and authenticated message, which is
		 * nacl.secretbox.overheadLength longer than the original message.
		 */
		public byte[] box(byte[] message) {
			if (message == null)
				return null;
			return box(message, 0, message.length);
		}

		public byte[] box(byte[] message, final int moff) {
			if (!(message != null && message.length > moff))
				return null;
			return box(message, moff, message.length - moff);
		}

		public byte[] box(byte[] message, final int moff, final int mlen) {
			// check message
			if (!(message != null && message.length >= (moff + mlen)))
				return null;
			return box(message, moff, message.length - moff, generateNonce());
		}

		public byte[] box(byte[] message, byte[] theNonce) {
			if (message == null)
				return null;
			return box(message, 0, message.length, theNonce);
		}

		public byte[] box(byte[] message, final int moff, byte[] theNonce) {
			if (!(message != null && message.length > moff))
				return null;
			return box(message, moff, message.length - moff, theNonce);
		}

		public byte[] box(byte[] message, final int moff, final int mlen, byte[] theNonce) {
			// check message
			if (!(message != null && message.length >= (moff + mlen) && theNonce != null && theNonce.length == nonceLength))
				return null;

			// message buffer
			byte[] m = new byte[mlen + zerobytesLength];

			// cipher buffer
			byte[] c = new byte[m.length];

			for (int i = 0; i < mlen; i++)
				m[i + zerobytesLength] = message[i + moff];

			if (0 != crypto_secretbox(c, m, m.length, theNonce, key))
				return null;

			// TBD optimizing ...
			// wrap byte_buf_t on c offset@boxzerobytesLength
			/// return new byte_buf_t(c, boxzerobytesLength, c.length-boxzerobytesLength);
			byte[] ret = new byte[c.length - boxzerobytesLength];

			for (int i = 0; i < ret.length; i++)
				ret[i] = c[i + boxzerobytesLength];

			return ret;
		}

		/*
		 * @description Authenticates and decrypts the given secret box using the key
		 * and the nonce.
		 *
		 * Returns the original message, or null if authentication fails.
		 */
		public byte[] open(byte[] box) {
			if (box == null)
				return null;
			return open(box, 0, box.length);
		}

		public byte[] open(byte[] box, final int boxoff) {
			if (!(box != null && box.length > boxoff))
				return null;
			return open(box, boxoff, box.length - boxoff);
		}

		public byte[] open(byte[] box, final int boxoff, final int boxlen) {
			// check message
			if (!(box != null && box.length >= (boxoff + boxlen) && boxlen >= boxzerobytesLength))
				return null;
			return open(box, boxoff, box.length - boxoff, generateNonce());
		}

		public byte[] open(byte[] box, byte[] theNonce) {
			if (box == null)
				return null;
			return open(box, 0, box.length, theNonce);
		}

		public byte[] open(byte[] box, final int boxoff, byte[] theNonce) {
			if (!(box != null && box.length > boxoff))
				return null;
			return open(box, boxoff, box.length - boxoff, theNonce);
		}

		public byte[] open(byte[] box, final int boxoff, final int boxlen, byte[] theNonce) {
			// check message
			if (!(box != null && box.length >= (boxoff + boxlen) && boxlen >= boxzerobytesLength && theNonce != null && theNonce.length == nonceLength))
				return null;

			// cipher buffer
			byte[] c = new byte[boxlen + boxzerobytesLength];

			// message buffer
			byte[] m = new byte[c.length];

			for (int i = 0; i < boxlen; i++)
				c[i + boxzerobytesLength] = box[i + boxoff];

			if (0 != crypto_secretbox_open(m, c, c.length, theNonce, key))
				return null;

			// wrap byte_buf_t on m offset@zerobytesLength
			/// return new byte_buf_t(m, zerobytesLength, m.length-zerobytesLength);
			byte[] ret = new byte[m.length - zerobytesLength];

			for (int i = 0; i < ret.length; i++)
				ret[i] = m[i + zerobytesLength];

			return ret;
		}

		/*
		 * @description Length of key in bytes.
		 */
		public static final int keyLength = 32;

		/*
		 * @description Length of nonce in bytes.
		 */
		public static final int nonceLength = 24;

		/*
		 * @description Length of overhead added to secret box compared to original
		 * message.
		 */
		public static final int overheadLength = 16;

		/*
		 * @description zero bytes in case box
		 */
		public static final int zerobytesLength = 32;
		/*
		 * @description zero bytes in case open box
		 */
		public static final int boxzerobytesLength = 16;

		public byte[] get_key() {
			return this.key;
		}

	}

	/*
	 * @description Scalar multiplication, Implements curve25519.
	 */
	public static final class ScalarMult {

		private final static String TAG = "ScalarMult";

		/*
		 * @description Multiplies an integer n by a group element p and returns the
		 * resulting group element.
		 */
		public static byte[] scalseMult(byte[] n, byte[] p) {
			if (!(n.length == scalarLength && p.length == groupElementLength))
				return null;

			byte[] q = new byte[scalarLength];

			crypto_scalarmult(q, n, p);

			return q;
		}

		/*
		 * @description Multiplies an integer n by a standard group element and returns
		 * the resulting group element.
		 */
		public static byte[] scalseMult_base(byte[] n) {
			if (!(n.length == scalarLength))
				return null;

			byte[] q = new byte[scalarLength];

			crypto_scalarmult_base(q, n);

			return q;
		}

		/*
		 * @description Length of scalar in bytes.
		 */
		public static final int scalarLength = 32;

		/*
		 * @description Length of group element in bytes.
		 */
		public static final int groupElementLength = 32;

	}

	/*
	 * @description Hash algorithm, Implements SHA-512.
	 */
	public static final class Hash {

		private final static String TAG = "Hash";

		/*
		 * @description Returns SHA-512 hash of the message.
		 */
		public static byte[] sha512(byte[] message) {
			if (!(message != null && message.length > 0))
				return null;

			byte[] out = new byte[hashLength];

			crypto_hash(out, message);

			return out;
		}

		public static byte[] sha512(String message) throws UnsupportedEncodingException {
			return sha512(message.getBytes("utf-8"));
		}

		/*
		 * @description Length of hash in bytes.
		 */
		public static final int hashLength = 64;

	}

	/*
	 * @description Signature algorithm, Implements ed25519.
	 */
	public static final class Signature {

		private final static String TAG = "Signature";

		private byte[] theirPublicKey;
		private byte[] mySecretKey;

		public Signature(byte[] theirPublicKey, byte[] mySecretKey) {
			this.theirPublicKey = theirPublicKey;
			this.mySecretKey = mySecretKey;
		}

		/*
		 * @description Signs the message using the secret key and returns a signed
		 * message.
		 */
		public byte[] sign(byte[] message) {
			if (message == null)
				return null;

			return sign(message, 0, message.length);
		}

		public byte[] sign(byte[] message, final int moff) {
			if (!(message != null && message.length > moff))
				return null;

			return sign(message, moff, message.length - moff);
		}

		public byte[] sign(byte[] message, final int moff, final int mlen) {
			// check message
			if (!(message != null && message.length >= (moff + mlen)))
				return null;

			// signed message
			byte[] sm = new byte[mlen + signatureLength];

			crypto_sign(sm, -1, message, moff, mlen, mySecretKey);

			return sm;
		}

		/*
		 * @description Verifies the signed message and returns the message without
		 * signature. Returns null if verification failed.
		 */
		public byte[] open(byte[] signedMessage) {
			if (signedMessage == null)
				return null;

			return open(signedMessage, 0, signedMessage.length);
		}

		public byte[] open(byte[] signedMessage, final int smoff) {
			if (!(signedMessage != null && signedMessage.length > smoff))
				return null;

			return open(signedMessage, smoff, signedMessage.length - smoff);
		}

		public byte[] open(byte[] signedMessage, final int smoff, final int smlen) {
			// check sm length
			if (!(signedMessage != null && signedMessage.length >= (smoff + smlen) && smlen >= signatureLength))
				return null;

			// temp buffer
			byte[] tmp = new byte[smlen];

			if (0 != crypto_sign_open(tmp, -1, signedMessage, smoff, smlen, theirPublicKey))
				return null;

			// message
			byte[] msg = new byte[smlen - signatureLength];
			for (int i = 0; i < msg.length; i++)
				msg[i] = signedMessage[smoff + i + signatureLength];

			return msg;
		}

		/*
		 * @description Signs the message using the secret key and returns a signature.
		 */
		public byte[] detached(byte[] message) {
			byte[] signedMsg = this.sign(message);
			byte[] sig = new byte[signatureLength];
			for (int i = 0; i < sig.length; i++)
				sig[i] = signedMsg[i];
			return sig;
		}

		/*
		 * @description Verifies the signature for the message and returns true if
		 * verification succeeded or false if it failed.
		 */
		public boolean detached_verify(byte[] message, byte[] signature) {
			if (signature.length != signatureLength)
				return false;
			if (theirPublicKey.length != publicKeyLength)
				return false;
			byte[] sm = new byte[signatureLength + message.length];
			byte[] m = new byte[signatureLength + message.length];
			for (int i = 0; i < signatureLength; i++)
				sm[i] = signature[i];
			for (int i = 0; i < message.length; i++)
				sm[i + signatureLength] = message[i];
			return (crypto_sign_open(m, -1, sm, 0, sm.length, theirPublicKey) >= 0);
		}

		/*
		 * @description Generates new random key pair for signing and returns it as an
		 * object with publicKey and secretKey members
		 */
		public static class KeyPair {
			private byte[] publicKey;
			private byte[] secretKey;

			public KeyPair() {
				publicKey = new byte[publicKeyLength];
				secretKey = new byte[secretKeyLength];
			}

			public byte[] getPublicKey() {
				return publicKey;
			}

			public byte[] getSecretKey() {
				return secretKey;
			}
		}

		/*
		 * @description Signs the message using the secret key and returns a signed
		 * message.
		 */
		public static KeyPair keyPair() {
			KeyPair kp = new KeyPair();

			crypto_sign_keypair(kp.getPublicKey(), kp.getSecretKey(), false);
			return kp;
		}

		public static KeyPair keyPair_fromSecretKey(byte[] secretKey) {
			KeyPair kp = new KeyPair();
			byte[] pk = kp.getPublicKey();
			byte[] sk = kp.getSecretKey();

			// copy sk
			for (int i = 0; i < kp.getSecretKey().length; i++)
				sk[i] = secretKey[i];

			// copy pk from sk
			for (int i = 0; i < kp.getPublicKey().length; i++)
				pk[i] = secretKey[32 + i]; // hard-copy

			return kp;
		}

		public static KeyPair keyPair_fromSeed(byte[] seed) {
			KeyPair kp = new KeyPair();
			byte[] pk = kp.getPublicKey();
			byte[] sk = kp.getSecretKey();

			// copy sk
			for (int i = 0; i < seedLength; i++)
				sk[i] = seed[i];

			// generate pk from sk
			crypto_sign_keypair(pk, sk, true);

			return kp;
		}

		/*
		 * @description Length of signing public key in bytes.
		 */
		public static final int publicKeyLength = 32;

		/*
		 * @description Length of signing secret key in bytes.
		 */
		public static final int secretKeyLength = 64;

		/*
		 * @description Length of seed for nacl.sign.keyPair.fromSeed in bytes.
		 */
		public static final int seedLength = 32;

		/*
		 * @description Length of signature in bytes.
		 */
		public static final int signatureLength = 64;
	}

	////////////////////////////////////////////////////////////////////////////////////
	/*
	 * @description Codes below are ported tweetnacl-fast.js from
	 * TweetNacl.c/TweetNacl.h
	 */

	private static final byte[] _0 = new byte[16];
	private static final byte[] _9 = new byte[32];
	static {
		/// for (int i = 0; i < _0.length; i ++) _0[i] = 0;

		/// for (int i = 0; i < _9.length; i ++) _9[i] = 0;
		_9[0] = 9;
	}

	private static final long[] gf0 = new long[16];
	private static final long[] gf1 = new long[16];
	private static final long[] _121665 = new long[16];
	static {
		/// for (int i = 0; i < gf0.length; i ++) gf0[i] = 0;

		/// for (int i = 0; i < gf1.length; i ++) gf1[i] = 0;
		gf1[0] = 1;

		/// for (int i = 0; i < _121665.length; i ++) _121665[i] = 0;
		_121665[0] = 0xDB41;
		_121665[1] = 1;
	}

	private static final long[] D = new long[]
		{ 0x78a3, 0x1359, 0x4dca, 0x75eb, 0xd8ab, 0x4141, 0x0a4d, 0x0070, 0xe898, 0x7779, 0x4079, 0x8cc7, 0xfe73, 0x2b6f, 0x6cee, 0x5203 };
	private static final long[] D2 = new long[]
		{ 0xf159, 0x26b2, 0x9b94, 0xebd6, 0xb156, 0x8283, 0x149a, 0x00e0, 0xd130, 0xeef3, 0x80f2, 0x198e, 0xfce7, 0x56df, 0xd9dc, 0x2406 };
	private static final long[] X = new long[]
		{ 0xd51a, 0x8f25, 0x2d60, 0xc956, 0xa7b2, 0x9525, 0xc760, 0x692c, 0xdc5c, 0xfdd6, 0xe231, 0xc0a4, 0x53fe, 0xcd6e, 0x36d3, 0x2169 };
	private static final long[] Y = new long[]
		{ 0x6658, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666, 0x6666 };
	private static final long[] I = new long[]
		{ 0xa0b0, 0x4a0e, 0x1b27, 0xc4ee, 0xe478, 0xad2f, 0x1806, 0x2f43, 0xd7a7, 0x3dfb, 0x0099, 0x2b4d, 0xdf0b, 0x4fc1, 0x2480, 0x2b83 };

	private static void ts64(byte[] x, final int xoff, long u) {
		/// int i;
		/// for (i = 7;i >= 0;--i) { x[i+xoff] = (byte)(u&0xff); u >>>= 8; }

		x[7 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[6 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[5 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[4 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[3 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[2 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[1 + xoff] = (byte) (u & 0xff);
		u >>>= 8;
		x[0 + xoff] = (byte) (u & 0xff); /// u >>>= 8;
	}

	private static int vn(byte[] x, final int xoff, byte[] y, final int yoff, int n) {
		int i, d = 0;
		for (i = 0; i < n; i++)
			d |= (x[i + xoff] ^ y[i + yoff]) & 0xff;
		return (1 & ((d - 1) >>> 8)) - 1;
	}

	private static int crypto_verify_16(byte[] x, final int xoff, byte[] y, final int yoff) {
		return vn(x, xoff, y, yoff, 16);
	}

	public static int crypto_verify_16(byte[] x, byte[] y) {
		return crypto_verify_16(x, 0, y, 0);
	}

	private static int crypto_verify_32(byte[] x, final int xoff, byte[] y, final int yoff) {
		return vn(x, xoff, y, yoff, 32);
	}

	public static int crypto_verify_32(byte[] x, byte[] y) {
		return crypto_verify_32(x, 0, y, 0);
	}

	private static void core_salsa20(byte[] o, byte[] p, byte[] k, byte[] c) {
		int j0 = c[0] & 0xff | (c[1] & 0xff) << 8 | (c[2] & 0xff) << 16 | (c[3] & 0xff) << 24,
				j1 = k[0] & 0xff | (k[1] & 0xff) << 8 | (k[2] & 0xff) << 16 | (k[3] & 0xff) << 24,
				j2 = k[4] & 0xff | (k[5] & 0xff) << 8 | (k[6] & 0xff) << 16 | (k[7] & 0xff) << 24,
				j3 = k[8] & 0xff | (k[9] & 0xff) << 8 | (k[10] & 0xff) << 16 | (k[11] & 0xff) << 24,
				j4 = k[12] & 0xff | (k[13] & 0xff) << 8 | (k[14] & 0xff) << 16 | (k[15] & 0xff) << 24,
				j5 = c[4] & 0xff | (c[5] & 0xff) << 8 | (c[6] & 0xff) << 16 | (c[7] & 0xff) << 24,
				j6 = p[0] & 0xff | (p[1] & 0xff) << 8 | (p[2] & 0xff) << 16 | (p[3] & 0xff) << 24,
				j7 = p[4] & 0xff | (p[5] & 0xff) << 8 | (p[6] & 0xff) << 16 | (p[7] & 0xff) << 24,
				j8 = p[8] & 0xff | (p[9] & 0xff) << 8 | (p[10] & 0xff) << 16 | (p[11] & 0xff) << 24,
				j9 = p[12] & 0xff | (p[13] & 0xff) << 8 | (p[14] & 0xff) << 16 | (p[15] & 0xff) << 24,
				j10 = c[8] & 0xff | (c[9] & 0xff) << 8 | (c[10] & 0xff) << 16 | (c[11] & 0xff) << 24,
				j11 = k[16] & 0xff | (k[17] & 0xff) << 8 | (k[18] & 0xff) << 16 | (k[19] & 0xff) << 24,
				j12 = k[20] & 0xff | (k[21] & 0xff) << 8 | (k[22] & 0xff) << 16 | (k[23] & 0xff) << 24,
				j13 = k[24] & 0xff | (k[25] & 0xff) << 8 | (k[26] & 0xff) << 16 | (k[27] & 0xff) << 24,
				j14 = k[28] & 0xff | (k[29] & 0xff) << 8 | (k[30] & 0xff) << 16 | (k[31] & 0xff) << 24,
				j15 = c[12] & 0xff | (c[13] & 0xff) << 8 | (c[14] & 0xff) << 16 | (c[15] & 0xff) << 24;

		int x0 = j0, x1 = j1, x2 = j2, x3 = j3, x4 = j4, x5 = j5, x6 = j6, x7 = j7, x8 = j8, x9 = j9, x10 = j10, x11 = j11, x12 = j12, x13 = j13, x14 = j14,
				x15 = j15, u;

		for (int i = 0; i < 20; i += 2) {
			u = x0 + x12 | 0;
			x4 ^= u << 7 | u >>> (32 - 7);
			u = x4 + x0 | 0;
			x8 ^= u << 9 | u >>> (32 - 9);
			u = x8 + x4 | 0;
			x12 ^= u << 13 | u >>> (32 - 13);
			u = x12 + x8 | 0;
			x0 ^= u << 18 | u >>> (32 - 18);

			u = x5 + x1 | 0;
			x9 ^= u << 7 | u >>> (32 - 7);
			u = x9 + x5 | 0;
			x13 ^= u << 9 | u >>> (32 - 9);
			u = x13 + x9 | 0;
			x1 ^= u << 13 | u >>> (32 - 13);
			u = x1 + x13 | 0;
			x5 ^= u << 18 | u >>> (32 - 18);

			u = x10 + x6 | 0;
			x14 ^= u << 7 | u >>> (32 - 7);
			u = x14 + x10 | 0;
			x2 ^= u << 9 | u >>> (32 - 9);
			u = x2 + x14 | 0;
			x6 ^= u << 13 | u >>> (32 - 13);
			u = x6 + x2 | 0;
			x10 ^= u << 18 | u >>> (32 - 18);

			u = x15 + x11 | 0;
			x3 ^= u << 7 | u >>> (32 - 7);
			u = x3 + x15 | 0;
			x7 ^= u << 9 | u >>> (32 - 9);
			u = x7 + x3 | 0;
			x11 ^= u << 13 | u >>> (32 - 13);
			u = x11 + x7 | 0;
			x15 ^= u << 18 | u >>> (32 - 18);

			u = x0 + x3 | 0;
			x1 ^= u << 7 | u >>> (32 - 7);
			u = x1 + x0 | 0;
			x2 ^= u << 9 | u >>> (32 - 9);
			u = x2 + x1 | 0;
			x3 ^= u << 13 | u >>> (32 - 13);
			u = x3 + x2 | 0;
			x0 ^= u << 18 | u >>> (32 - 18);

			u = x5 + x4 | 0;
			x6 ^= u << 7 | u >>> (32 - 7);
			u = x6 + x5 | 0;
			x7 ^= u << 9 | u >>> (32 - 9);
			u = x7 + x6 | 0;
			x4 ^= u << 13 | u >>> (32 - 13);
			u = x4 + x7 | 0;
			x5 ^= u << 18 | u >>> (32 - 18);

			u = x10 + x9 | 0;
			x11 ^= u << 7 | u >>> (32 - 7);
			u = x11 + x10 | 0;
			x8 ^= u << 9 | u >>> (32 - 9);
			u = x8 + x11 | 0;
			x9 ^= u << 13 | u >>> (32 - 13);
			u = x9 + x8 | 0;
			x10 ^= u << 18 | u >>> (32 - 18);

			u = x15 + x14 | 0;
			x12 ^= u << 7 | u >>> (32 - 7);
			u = x12 + x15 | 0;
			x13 ^= u << 9 | u >>> (32 - 9);
			u = x13 + x12 | 0;
			x14 ^= u << 13 | u >>> (32 - 13);
			u = x14 + x13 | 0;
			x15 ^= u << 18 | u >>> (32 - 18);
		}
		x0 = x0 + j0 | 0;
		x1 = x1 + j1 | 0;
		x2 = x2 + j2 | 0;
		x3 = x3 + j3 | 0;
		x4 = x4 + j4 | 0;
		x5 = x5 + j5 | 0;
		x6 = x6 + j6 | 0;
		x7 = x7 + j7 | 0;
		x8 = x8 + j8 | 0;
		x9 = x9 + j9 | 0;
		x10 = x10 + j10 | 0;
		x11 = x11 + j11 | 0;
		x12 = x12 + j12 | 0;
		x13 = x13 + j13 | 0;
		x14 = x14 + j14 | 0;
		x15 = x15 + j15 | 0;

		o[0] = (byte) (x0 >>> 0 & 0xff);
		o[1] = (byte) (x0 >>> 8 & 0xff);
		o[2] = (byte) (x0 >>> 16 & 0xff);
		o[3] = (byte) (x0 >>> 24 & 0xff);

		o[4] = (byte) (x1 >>> 0 & 0xff);
		o[5] = (byte) (x1 >>> 8 & 0xff);
		o[6] = (byte) (x1 >>> 16 & 0xff);
		o[7] = (byte) (x1 >>> 24 & 0xff);

		o[8] = (byte) (x2 >>> 0 & 0xff);
		o[9] = (byte) (x2 >>> 8 & 0xff);
		o[10] = (byte) (x2 >>> 16 & 0xff);
		o[11] = (byte) (x2 >>> 24 & 0xff);

		o[12] = (byte) (x3 >>> 0 & 0xff);
		o[13] = (byte) (x3 >>> 8 & 0xff);
		o[14] = (byte) (x3 >>> 16 & 0xff);
		o[15] = (byte) (x3 >>> 24 & 0xff);

		o[16] = (byte) (x4 >>> 0 & 0xff);
		o[17] = (byte) (x4 >>> 8 & 0xff);
		o[18] = (byte) (x4 >>> 16 & 0xff);
		o[19] = (byte) (x4 >>> 24 & 0xff);

		o[20] = (byte) (x5 >>> 0 & 0xff);
		o[21] = (byte) (x5 >>> 8 & 0xff);
		o[22] = (byte) (x5 >>> 16 & 0xff);
		o[23] = (byte) (x5 >>> 24 & 0xff);

		o[24] = (byte) (x6 >>> 0 & 0xff);
		o[25] = (byte) (x6 >>> 8 & 0xff);
		o[26] = (byte) (x6 >>> 16 & 0xff);
		o[27] = (byte) (x6 >>> 24 & 0xff);

		o[28] = (byte) (x7 >>> 0 & 0xff);
		o[29] = (byte) (x7 >>> 8 & 0xff);
		o[30] = (byte) (x7 >>> 16 & 0xff);
		o[31] = (byte) (x7 >>> 24 & 0xff);

		o[32] = (byte) (x8 >>> 0 & 0xff);
		o[33] = (byte) (x8 >>> 8 & 0xff);
		o[34] = (byte) (x8 >>> 16 & 0xff);
		o[35] = (byte) (x8 >>> 24 & 0xff);

		o[36] = (byte) (x9 >>> 0 & 0xff);
		o[37] = (byte) (x9 >>> 8 & 0xff);
		o[38] = (byte) (x9 >>> 16 & 0xff);
		o[39] = (byte) (x9 >>> 24 & 0xff);

		o[40] = (byte) (x10 >>> 0 & 0xff);
		o[41] = (byte) (x10 >>> 8 & 0xff);
		o[42] = (byte) (x10 >>> 16 & 0xff);
		o[43] = (byte) (x10 >>> 24 & 0xff);

		o[44] = (byte) (x11 >>> 0 & 0xff);
		o[45] = (byte) (x11 >>> 8 & 0xff);
		o[46] = (byte) (x11 >>> 16 & 0xff);
		o[47] = (byte) (x11 >>> 24 & 0xff);

		o[48] = (byte) (x12 >>> 0 & 0xff);
		o[49] = (byte) (x12 >>> 8 & 0xff);
		o[50] = (byte) (x12 >>> 16 & 0xff);
		o[51] = (byte) (x12 >>> 24 & 0xff);

		o[52] = (byte) (x13 >>> 0 & 0xff);
		o[53] = (byte) (x13 >>> 8 & 0xff);
		o[54] = (byte) (x13 >>> 16 & 0xff);
		o[55] = (byte) (x13 >>> 24 & 0xff);

		o[56] = (byte) (x14 >>> 0 & 0xff);
		o[57] = (byte) (x14 >>> 8 & 0xff);
		o[58] = (byte) (x14 >>> 16 & 0xff);
		o[59] = (byte) (x14 >>> 24 & 0xff);

		o[60] = (byte) (x15 >>> 0 & 0xff);
		o[61] = (byte) (x15 >>> 8 & 0xff);
		o[62] = (byte) (x15 >>> 16 & 0xff);
		o[63] = (byte) (x15 >>> 24 & 0xff);

		/*
		 * String dbgt = ""; for (int dbg = 0; dbg < o.length; dbg ++) dbgt +=
		 * " "+o[dbg]; Log.d(TAG, "core_salsa20 -> "+dbgt);
		 */
	}

	private static void core_hsalsa20(byte[] o, byte[] p, byte[] k, byte[] c) {
		int j0 = c[0] & 0xff | (c[1] & 0xff) << 8 | (c[2] & 0xff) << 16 | (c[3] & 0xff) << 24,
				j1 = k[0] & 0xff | (k[1] & 0xff) << 8 | (k[2] & 0xff) << 16 | (k[3] & 0xff) << 24,
				j2 = k[4] & 0xff | (k[5] & 0xff) << 8 | (k[6] & 0xff) << 16 | (k[7] & 0xff) << 24,
				j3 = k[8] & 0xff | (k[9] & 0xff) << 8 | (k[10] & 0xff) << 16 | (k[11] & 0xff) << 24,
				j4 = k[12] & 0xff | (k[13] & 0xff) << 8 | (k[14] & 0xff) << 16 | (k[15] & 0xff) << 24,
				j5 = c[4] & 0xff | (c[5] & 0xff) << 8 | (c[6] & 0xff) << 16 | (c[7] & 0xff) << 24,
				j6 = p[0] & 0xff | (p[1] & 0xff) << 8 | (p[2] & 0xff) << 16 | (p[3] & 0xff) << 24,
				j7 = p[4] & 0xff | (p[5] & 0xff) << 8 | (p[6] & 0xff) << 16 | (p[7] & 0xff) << 24,
				j8 = p[8] & 0xff | (p[9] & 0xff) << 8 | (p[10] & 0xff) << 16 | (p[11] & 0xff) << 24,
				j9 = p[12] & 0xff | (p[13] & 0xff) << 8 | (p[14] & 0xff) << 16 | (p[15] & 0xff) << 24,
				j10 = c[8] & 0xff | (c[9] & 0xff) << 8 | (c[10] & 0xff) << 16 | (c[11] & 0xff) << 24,
				j11 = k[16] & 0xff | (k[17] & 0xff) << 8 | (k[18] & 0xff) << 16 | (k[19] & 0xff) << 24,
				j12 = k[20] & 0xff | (k[21] & 0xff) << 8 | (k[22] & 0xff) << 16 | (k[23] & 0xff) << 24,
				j13 = k[24] & 0xff | (k[25] & 0xff) << 8 | (k[26] & 0xff) << 16 | (k[27] & 0xff) << 24,
				j14 = k[28] & 0xff | (k[29] & 0xff) << 8 | (k[30] & 0xff) << 16 | (k[31] & 0xff) << 24,
				j15 = c[12] & 0xff | (c[13] & 0xff) << 8 | (c[14] & 0xff) << 16 | (c[15] & 0xff) << 24;

		int x0 = j0, x1 = j1, x2 = j2, x3 = j3, x4 = j4, x5 = j5, x6 = j6, x7 = j7, x8 = j8, x9 = j9, x10 = j10, x11 = j11, x12 = j12, x13 = j13, x14 = j14,
				x15 = j15, u;

		for (int i = 0; i < 20; i += 2) {
			u = x0 + x12 | 0;
			x4 ^= u << 7 | u >>> (32 - 7);
			u = x4 + x0 | 0;
			x8 ^= u << 9 | u >>> (32 - 9);
			u = x8 + x4 | 0;
			x12 ^= u << 13 | u >>> (32 - 13);
			u = x12 + x8 | 0;
			x0 ^= u << 18 | u >>> (32 - 18);

			u = x5 + x1 | 0;
			x9 ^= u << 7 | u >>> (32 - 7);
			u = x9 + x5 | 0;
			x13 ^= u << 9 | u >>> (32 - 9);
			u = x13 + x9 | 0;
			x1 ^= u << 13 | u >>> (32 - 13);
			u = x1 + x13 | 0;
			x5 ^= u << 18 | u >>> (32 - 18);

			u = x10 + x6 | 0;
			x14 ^= u << 7 | u >>> (32 - 7);
			u = x14 + x10 | 0;
			x2 ^= u << 9 | u >>> (32 - 9);
			u = x2 + x14 | 0;
			x6 ^= u << 13 | u >>> (32 - 13);
			u = x6 + x2 | 0;
			x10 ^= u << 18 | u >>> (32 - 18);

			u = x15 + x11 | 0;
			x3 ^= u << 7 | u >>> (32 - 7);
			u = x3 + x15 | 0;
			x7 ^= u << 9 | u >>> (32 - 9);
			u = x7 + x3 | 0;
			x11 ^= u << 13 | u >>> (32 - 13);
			u = x11 + x7 | 0;
			x15 ^= u << 18 | u >>> (32 - 18);

			u = x0 + x3 | 0;
			x1 ^= u << 7 | u >>> (32 - 7);
			u = x1 + x0 | 0;
			x2 ^= u << 9 | u >>> (32 - 9);
			u = x2 + x1 | 0;
			x3 ^= u << 13 | u >>> (32 - 13);
			u = x3 + x2 | 0;
			x0 ^= u << 18 | u >>> (32 - 18);

			u = x5 + x4 | 0;
			x6 ^= u << 7 | u >>> (32 - 7);
			u = x6 + x5 | 0;
			x7 ^= u << 9 | u >>> (32 - 9);
			u = x7 + x6 | 0;
			x4 ^= u << 13 | u >>> (32 - 13);
			u = x4 + x7 | 0;
			x5 ^= u << 18 | u >>> (32 - 18);

			u = x10 + x9 | 0;
			x11 ^= u << 7 | u >>> (32 - 7);
			u = x11 + x10 | 0;
			x8 ^= u << 9 | u >>> (32 - 9);
			u = x8 + x11 | 0;
			x9 ^= u << 13 | u >>> (32 - 13);
			u = x9 + x8 | 0;
			x10 ^= u << 18 | u >>> (32 - 18);

			u = x15 + x14 | 0;
			x12 ^= u << 7 | u >>> (32 - 7);
			u = x12 + x15 | 0;
			x13 ^= u << 9 | u >>> (32 - 9);
			u = x13 + x12 | 0;
			x14 ^= u << 13 | u >>> (32 - 13);
			u = x14 + x13 | 0;
			x15 ^= u << 18 | u >>> (32 - 18);
		}

		o[0] = (byte) (x0 >>> 0 & 0xff);
		o[1] = (byte) (x0 >>> 8 & 0xff);
		o[2] = (byte) (x0 >>> 16 & 0xff);
		o[3] = (byte) (x0 >>> 24 & 0xff);

		o[4] = (byte) (x5 >>> 0 & 0xff);
		o[5] = (byte) (x5 >>> 8 & 0xff);
		o[6] = (byte) (x5 >>> 16 & 0xff);
		o[7] = (byte) (x5 >>> 24 & 0xff);

		o[8] = (byte) (x10 >>> 0 & 0xff);
		o[9] = (byte) (x10 >>> 8 & 0xff);
		o[10] = (byte) (x10 >>> 16 & 0xff);
		o[11] = (byte) (x10 >>> 24 & 0xff);

		o[12] = (byte) (x15 >>> 0 & 0xff);
		o[13] = (byte) (x15 >>> 8 & 0xff);
		o[14] = (byte) (x15 >>> 16 & 0xff);
		o[15] = (byte) (x15 >>> 24 & 0xff);

		o[16] = (byte) (x6 >>> 0 & 0xff);
		o[17] = (byte) (x6 >>> 8 & 0xff);
		o[18] = (byte) (x6 >>> 16 & 0xff);
		o[19] = (byte) (x6 >>> 24 & 0xff);

		o[20] = (byte) (x7 >>> 0 & 0xff);
		o[21] = (byte) (x7 >>> 8 & 0xff);
		o[22] = (byte) (x7 >>> 16 & 0xff);
		o[23] = (byte) (x7 >>> 24 & 0xff);

		o[24] = (byte) (x8 >>> 0 & 0xff);
		o[25] = (byte) (x8 >>> 8 & 0xff);
		o[26] = (byte) (x8 >>> 16 & 0xff);
		o[27] = (byte) (x8 >>> 24 & 0xff);

		o[28] = (byte) (x9 >>> 0 & 0xff);
		o[29] = (byte) (x9 >>> 8 & 0xff);
		o[30] = (byte) (x9 >>> 16 & 0xff);
		o[31] = (byte) (x9 >>> 24 & 0xff);

		/*
		 * String dbgt = ""; for (int dbg = 0; dbg < o.length; dbg ++) dbgt +=
		 * " "+o[dbg]; Log.d(TAG, "core_hsalsa20 -> "+dbgt);
		 */
	}

	public static int crypto_core_salsa20(byte[] out, byte[] in, byte[] k, byte[] c) {
		/// core(out,in,k,c,0);
		core_salsa20(out, in, k, c);

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < out.length; dbg ++) dbgt += " "+out[dbg];
		/// L/og.d(TAG, "crypto_core_salsa20 -> "+dbgt);

		return 0;
	}

	public static int crypto_core_hsalsa20(byte[] out, byte[] in, byte[] k, byte[] c) {
		/// core(out,in,k,c,1);
		core_hsalsa20(out, in, k, c);

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < out.length; dbg ++) dbgt += " "+out[dbg];
		/// L/og.d(TAG, "crypto_core_hsalsa20 -> "+dbgt);

		return 0;
	}

	// "expand 32-byte k"
	private static final byte[] sigma =
		{ 101, 120, 112, 97, 110, 100, 32, 51, 50, 45, 98, 121, 116, 101, 32, 107 };

	/*
	 * static { try { sigma = "expand 32-byte k".getBytes("utf-8"); } catch
	 * (UnsupportedEncodingException e) { e.printStackTrace(); } }
	 */

	private static int crypto_stream_salsa20_xor(byte[] c, int cpos, byte[] m, int mpos, long b, byte[] n, byte[] k) {
		byte[] z = new byte[16], x = new byte[64];
		int u, i;
		for (i = 0; i < 16; i++)
			z[i] = 0;
		for (i = 0; i < 8; i++)
			z[i] = n[i];
		while (b >= 64) {
			crypto_core_salsa20(x, z, k, sigma);
			for (i = 0; i < 64; i++)
				c[cpos + i] = (byte) ((m[mpos + i] ^ x[i]) & 0xff);
			u = 1;
			for (i = 8; i < 16; i++) {
				u = u + (z[i] & 0xff) | 0;
				z[i] = (byte) (u & 0xff);
				u >>>= 8;
			}
			b -= 64;
			cpos += 64;
			mpos += 64;
		}
		if (b > 0) {
			crypto_core_salsa20(x, z, k, sigma);
			for (i = 0; i < b; i++)
				c[cpos + i] = (byte) ((m[mpos + i] ^ x[i]) & 0xff);
		}

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < c.length-cpos; dbg ++) dbgt += " "+c[dbg +cpos];
		/// Log.d(TAG, "crypto_stream_salsa20_xor, c -> "+dbgt);

		return 0;
	}

	public static int crypto_stream_salsa20(byte[] c, int cpos, long b, byte[] n, byte[] k) {
		byte[] z = new byte[16], x = new byte[64];
		int u, i;
		for (i = 0; i < 16; i++)
			z[i] = 0;
		for (i = 0; i < 8; i++)
			z[i] = n[i];
		while (b >= 64) {
			crypto_core_salsa20(x, z, k, sigma);
			for (i = 0; i < 64; i++)
				c[cpos + i] = x[i];
			u = 1;
			for (i = 8; i < 16; i++) {
				u = u + (z[i] & 0xff) | 0;
				z[i] = (byte) (u & 0xff);
				u >>>= 8;
			}
			b -= 64;
			cpos += 64;
		}
		if (b > 0) {
			crypto_core_salsa20(x, z, k, sigma);
			for (i = 0; i < b; i++)
				c[cpos + i] = x[i];
		}

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < c.length-cpos; dbg ++) dbgt += " "+c[dbg +cpos];
		/// Log.d(TAG, "crypto_stream_salsa20, c -> "+dbgt);

		return 0;
	}

	public static int crypto_stream(byte[] c, int cpos, long d, byte[] n, byte[] k) {
		byte[] s = new byte[32];
		crypto_core_hsalsa20(s, n, k, sigma);
		byte[] sn = new byte[8];
		for (int i = 0; i < 8; i++)
			sn[i] = n[i + 16];
		return crypto_stream_salsa20(c, cpos, d, sn, s);
	}

	public static int crypto_stream_xor(byte[] c, int cpos, byte[] m, int mpos, long d, byte[] n, byte[] k) {
		byte[] s = new byte[32];

		/*
		 * String dbgt = ""; for (int dbg = 0; dbg < n.length; dbg ++) dbgt +=
		 * " "+n[dbg]; Log.d(TAG, "crypto_stream_xor, nonce -> "+dbgt);
		 * 
		 * dbgt = ""; for (int dbg = 0; dbg < k.length; dbg ++) dbgt += " "+k[dbg];
		 * Log.d(TAG, "crypto_stream_xor, shk -> "+dbgt);
		 */

		crypto_core_hsalsa20(s, n, k, sigma);
		byte[] sn = new byte[8];
		for (int i = 0; i < 8; i++)
			sn[i] = n[i + 16];
		return crypto_stream_salsa20_xor(c, cpos, m, mpos, d, sn, s);
	}

	/*
	 * Port of Andrew Moon's Poly1305-donna-16. Public domain.
	 * https://github.com/floodyberry/poly1305-donna
	 */
	public static final class poly1305 {

		private byte[] buffer;
		private int[] r;
		private int[] h;
		private int[] pad;
		private int leftover;
		private int fin;

		public poly1305(byte[] key) {
			this.buffer = new byte[16];
			this.r = new int[10];
			this.h = new int[10];
			this.pad = new int[8];
			this.leftover = 0;
			this.fin = 0;

			int t0, t1, t2, t3, t4, t5, t6, t7;

			t0 = key[0] & 0xff | (key[1] & 0xff) << 8;
			this.r[0] = (t0) & 0x1fff;
			t1 = key[2] & 0xff | (key[3] & 0xff) << 8;
			this.r[1] = ((t0 >>> 13) | (t1 << 3)) & 0x1fff;
			t2 = key[4] & 0xff | (key[5] & 0xff) << 8;
			this.r[2] = ((t1 >>> 10) | (t2 << 6)) & 0x1f03;
			t3 = key[6] & 0xff | (key[7] & 0xff) << 8;
			this.r[3] = ((t2 >>> 7) | (t3 << 9)) & 0x1fff;
			t4 = key[8] & 0xff | (key[9] & 0xff) << 8;
			this.r[4] = ((t3 >>> 4) | (t4 << 12)) & 0x00ff;
			this.r[5] = ((t4 >>> 1)) & 0x1ffe;
			t5 = key[10] & 0xff | (key[11] & 0xff) << 8;
			this.r[6] = ((t4 >>> 14) | (t5 << 2)) & 0x1fff;
			t6 = key[12] & 0xff | (key[13] & 0xff) << 8;
			this.r[7] = ((t5 >>> 11) | (t6 << 5)) & 0x1f81;
			t7 = key[14] & 0xff | (key[15] & 0xff) << 8;
			this.r[8] = ((t6 >>> 8) | (t7 << 8)) & 0x1fff;
			this.r[9] = ((t7 >>> 5)) & 0x007f;

			this.pad[0] = key[16] & 0xff | (key[17] & 0xff) << 8;
			this.pad[1] = key[18] & 0xff | (key[19] & 0xff) << 8;
			this.pad[2] = key[20] & 0xff | (key[21] & 0xff) << 8;
			this.pad[3] = key[22] & 0xff | (key[23] & 0xff) << 8;
			this.pad[4] = key[24] & 0xff | (key[25] & 0xff) << 8;
			this.pad[5] = key[26] & 0xff | (key[27] & 0xff) << 8;
			this.pad[6] = key[28] & 0xff | (key[29] & 0xff) << 8;
			this.pad[7] = key[30] & 0xff | (key[31] & 0xff) << 8;
		}

		public poly1305 blocks(byte[] m, int mpos, int bytes) {
			int hibit = this.fin != 0 ? 0 : (1 << 11);
			int t0, t1, t2, t3, t4, t5, t6, t7, c;
			int d0, d1, d2, d3, d4, d5, d6, d7, d8, d9;

			int h0 = this.h[0], h1 = this.h[1], h2 = this.h[2], h3 = this.h[3], h4 = this.h[4], h5 = this.h[5], h6 = this.h[6], h7 = this.h[7], h8 = this.h[8],
					h9 = this.h[9];

			int r0 = this.r[0], r1 = this.r[1], r2 = this.r[2], r3 = this.r[3], r4 = this.r[4], r5 = this.r[5], r6 = this.r[6], r7 = this.r[7], r8 = this.r[8],
					r9 = this.r[9];

			while (bytes >= 16) {
				t0 = m[mpos + 0] & 0xff | (m[mpos + 1] & 0xff) << 8;
				h0 += (t0) & 0x1fff;
				t1 = m[mpos + 2] & 0xff | (m[mpos + 3] & 0xff) << 8;
				h1 += ((t0 >>> 13) | (t1 << 3)) & 0x1fff;
				t2 = m[mpos + 4] & 0xff | (m[mpos + 5] & 0xff) << 8;
				h2 += ((t1 >>> 10) | (t2 << 6)) & 0x1fff;
				t3 = m[mpos + 6] & 0xff | (m[mpos + 7] & 0xff) << 8;
				h3 += ((t2 >>> 7) | (t3 << 9)) & 0x1fff;
				t4 = m[mpos + 8] & 0xff | (m[mpos + 9] & 0xff) << 8;
				h4 += ((t3 >>> 4) | (t4 << 12)) & 0x1fff;
				h5 += ((t4 >>> 1)) & 0x1fff;
				t5 = m[mpos + 10] & 0xff | (m[mpos + 11] & 0xff) << 8;
				h6 += ((t4 >>> 14) | (t5 << 2)) & 0x1fff;
				t6 = m[mpos + 12] & 0xff | (m[mpos + 13] & 0xff) << 8;
				h7 += ((t5 >>> 11) | (t6 << 5)) & 0x1fff;
				t7 = m[mpos + 14] & 0xff | (m[mpos + 15] & 0xff) << 8;
				h8 += ((t6 >>> 8) | (t7 << 8)) & 0x1fff;
				h9 += ((t7 >>> 5)) | hibit;

				c = 0;

				d0 = c;
				d0 += h0 * r0;
				d0 += h1 * (5 * r9);
				d0 += h2 * (5 * r8);
				d0 += h3 * (5 * r7);
				d0 += h4 * (5 * r6);
				c = (d0 >>> 13);
				d0 &= 0x1fff;
				d0 += h5 * (5 * r5);
				d0 += h6 * (5 * r4);
				d0 += h7 * (5 * r3);
				d0 += h8 * (5 * r2);
				d0 += h9 * (5 * r1);
				c += (d0 >>> 13);
				d0 &= 0x1fff;

				d1 = c;
				d1 += h0 * r1;
				d1 += h1 * r0;
				d1 += h2 * (5 * r9);
				d1 += h3 * (5 * r8);
				d1 += h4 * (5 * r7);
				c = (d1 >>> 13);
				d1 &= 0x1fff;
				d1 += h5 * (5 * r6);
				d1 += h6 * (5 * r5);
				d1 += h7 * (5 * r4);
				d1 += h8 * (5 * r3);
				d1 += h9 * (5 * r2);
				c += (d1 >>> 13);
				d1 &= 0x1fff;

				d2 = c;
				d2 += h0 * r2;
				d2 += h1 * r1;
				d2 += h2 * r0;
				d2 += h3 * (5 * r9);
				d2 += h4 * (5 * r8);
				c = (d2 >>> 13);
				d2 &= 0x1fff;
				d2 += h5 * (5 * r7);
				d2 += h6 * (5 * r6);
				d2 += h7 * (5 * r5);
				d2 += h8 * (5 * r4);
				d2 += h9 * (5 * r3);
				c += (d2 >>> 13);
				d2 &= 0x1fff;

				d3 = c;
				d3 += h0 * r3;
				d3 += h1 * r2;
				d3 += h2 * r1;
				d3 += h3 * r0;
				d3 += h4 * (5 * r9);
				c = (d3 >>> 13);
				d3 &= 0x1fff;
				d3 += h5 * (5 * r8);
				d3 += h6 * (5 * r7);
				d3 += h7 * (5 * r6);
				d3 += h8 * (5 * r5);
				d3 += h9 * (5 * r4);
				c += (d3 >>> 13);
				d3 &= 0x1fff;

				d4 = c;
				d4 += h0 * r4;
				d4 += h1 * r3;
				d4 += h2 * r2;
				d4 += h3 * r1;
				d4 += h4 * r0;
				c = (d4 >>> 13);
				d4 &= 0x1fff;
				d4 += h5 * (5 * r9);
				d4 += h6 * (5 * r8);
				d4 += h7 * (5 * r7);
				d4 += h8 * (5 * r6);
				d4 += h9 * (5 * r5);
				c += (d4 >>> 13);
				d4 &= 0x1fff;

				d5 = c;
				d5 += h0 * r5;
				d5 += h1 * r4;
				d5 += h2 * r3;
				d5 += h3 * r2;
				d5 += h4 * r1;
				c = (d5 >>> 13);
				d5 &= 0x1fff;
				d5 += h5 * r0;
				d5 += h6 * (5 * r9);
				d5 += h7 * (5 * r8);
				d5 += h8 * (5 * r7);
				d5 += h9 * (5 * r6);
				c += (d5 >>> 13);
				d5 &= 0x1fff;

				d6 = c;
				d6 += h0 * r6;
				d6 += h1 * r5;
				d6 += h2 * r4;
				d6 += h3 * r3;
				d6 += h4 * r2;
				c = (d6 >>> 13);
				d6 &= 0x1fff;
				d6 += h5 * r1;
				d6 += h6 * r0;
				d6 += h7 * (5 * r9);
				d6 += h8 * (5 * r8);
				d6 += h9 * (5 * r7);
				c += (d6 >>> 13);
				d6 &= 0x1fff;

				d7 = c;
				d7 += h0 * r7;
				d7 += h1 * r6;
				d7 += h2 * r5;
				d7 += h3 * r4;
				d7 += h4 * r3;
				c = (d7 >>> 13);
				d7 &= 0x1fff;
				d7 += h5 * r2;
				d7 += h6 * r1;
				d7 += h7 * r0;
				d7 += h8 * (5 * r9);
				d7 += h9 * (5 * r8);
				c += (d7 >>> 13);
				d7 &= 0x1fff;

				d8 = c;
				d8 += h0 * r8;
				d8 += h1 * r7;
				d8 += h2 * r6;
				d8 += h3 * r5;
				d8 += h4 * r4;
				c = (d8 >>> 13);
				d8 &= 0x1fff;
				d8 += h5 * r3;
				d8 += h6 * r2;
				d8 += h7 * r1;
				d8 += h8 * r0;
				d8 += h9 * (5 * r9);
				c += (d8 >>> 13);
				d8 &= 0x1fff;

				d9 = c;
				d9 += h0 * r9;
				d9 += h1 * r8;
				d9 += h2 * r7;
				d9 += h3 * r6;
				d9 += h4 * r5;
				c = (d9 >>> 13);
				d9 &= 0x1fff;
				d9 += h5 * r4;
				d9 += h6 * r3;
				d9 += h7 * r2;
				d9 += h8 * r1;
				d9 += h9 * r0;
				c += (d9 >>> 13);
				d9 &= 0x1fff;

				c = (((c << 2) + c)) | 0;
				c = (c + d0) | 0;
				d0 = c & 0x1fff;
				c = (c >>> 13);
				d1 += c;

				h0 = d0;
				h1 = d1;
				h2 = d2;
				h3 = d3;
				h4 = d4;
				h5 = d5;
				h6 = d6;
				h7 = d7;
				h8 = d8;
				h9 = d9;

				mpos += 16;
				bytes -= 16;
			}
			this.h[0] = h0;
			this.h[1] = h1;
			this.h[2] = h2;
			this.h[3] = h3;
			this.h[4] = h4;
			this.h[5] = h5;
			this.h[6] = h6;
			this.h[7] = h7;
			this.h[8] = h8;
			this.h[9] = h9;

			return this;
		}

		public poly1305 finish(byte[] mac, int macpos) {
			int[] g = new int[10];
			int c, mask, f, i;

			if (this.leftover != 0) {
				i = this.leftover;
				this.buffer[i++] = 1;
				for (; i < 16; i++)
					this.buffer[i] = 0;
				this.fin = 1;
				this.blocks(this.buffer, 0, 16);
			}

			c = this.h[1] >>> 13;
			this.h[1] &= 0x1fff;
			for (i = 2; i < 10; i++) {
				this.h[i] += c;
				c = this.h[i] >>> 13;
				this.h[i] &= 0x1fff;
			}
			this.h[0] += (c * 5);
			c = this.h[0] >>> 13;
			this.h[0] &= 0x1fff;
			this.h[1] += c;
			c = this.h[1] >>> 13;
			this.h[1] &= 0x1fff;
			this.h[2] += c;

			g[0] = this.h[0] + 5;
			c = g[0] >>> 13;
			g[0] &= 0x1fff;
			for (i = 1; i < 10; i++) {
				g[i] = this.h[i] + c;
				c = g[i] >>> 13;
				g[i] &= 0x1fff;
			}
			g[9] -= (1 << 13);
			g[9] &= 0xffff;

			/*
			 * backport from tweetnacl-fast.js
			 * https://github.com/dchest/tweetnacl-js/releases/tag/v0.14.3 <<< "The issue
			 * was not properly detecting if st->h was >= 2^130 - 5, coupled with [testing
			 * mistake] not catching the failure. The chance of the bug affecting anything
			 * in the real world is essentially zero luckily, but it's good to have it
			 * fixed." >>>
			 */
			/// change mask = (g[9] >>> ((2 * 8) - 1)) - 1; to as
			mask = (c ^ 1) - 1;
			mask &= 0xffff;
			///////////////////////////////////////

			for (i = 0; i < 10; i++)
				g[i] &= mask;
			mask = ~mask;
			for (i = 0; i < 10; i++)
				this.h[i] = (this.h[i] & mask) | g[i];

			this.h[0] = ((this.h[0]) | (this.h[1] << 13)) & 0xffff;
			this.h[1] = ((this.h[1] >>> 3) | (this.h[2] << 10)) & 0xffff;
			this.h[2] = ((this.h[2] >>> 6) | (this.h[3] << 7)) & 0xffff;
			this.h[3] = ((this.h[3] >>> 9) | (this.h[4] << 4)) & 0xffff;
			this.h[4] = ((this.h[4] >>> 12) | (this.h[5] << 1) | (this.h[6] << 14)) & 0xffff;
			this.h[5] = ((this.h[6] >>> 2) | (this.h[7] << 11)) & 0xffff;
			this.h[6] = ((this.h[7] >>> 5) | (this.h[8] << 8)) & 0xffff;
			this.h[7] = ((this.h[8] >>> 8) | (this.h[9] << 5)) & 0xffff;

			f = this.h[0] + this.pad[0];
			this.h[0] = f & 0xffff;
			for (i = 1; i < 8; i++) {
				f = (((this.h[i] + this.pad[i]) | 0) + (f >>> 16)) | 0;
				this.h[i] = f & 0xffff;
			}

			mac[macpos + 0] = (byte) ((this.h[0] >>> 0) & 0xff);
			mac[macpos + 1] = (byte) ((this.h[0] >>> 8) & 0xff);
			mac[macpos + 2] = (byte) ((this.h[1] >>> 0) & 0xff);
			mac[macpos + 3] = (byte) ((this.h[1] >>> 8) & 0xff);
			mac[macpos + 4] = (byte) ((this.h[2] >>> 0) & 0xff);
			mac[macpos + 5] = (byte) ((this.h[2] >>> 8) & 0xff);
			mac[macpos + 6] = (byte) ((this.h[3] >>> 0) & 0xff);
			mac[macpos + 7] = (byte) ((this.h[3] >>> 8) & 0xff);
			mac[macpos + 8] = (byte) ((this.h[4] >>> 0) & 0xff);
			mac[macpos + 9] = (byte) ((this.h[4] >>> 8) & 0xff);
			mac[macpos + 10] = (byte) ((this.h[5] >>> 0) & 0xff);
			mac[macpos + 11] = (byte) ((this.h[5] >>> 8) & 0xff);
			mac[macpos + 12] = (byte) ((this.h[6] >>> 0) & 0xff);
			mac[macpos + 13] = (byte) ((this.h[6] >>> 8) & 0xff);
			mac[macpos + 14] = (byte) ((this.h[7] >>> 0) & 0xff);
			mac[macpos + 15] = (byte) ((this.h[7] >>> 8) & 0xff);

			return this;
		}

		public poly1305 update(byte[] m, int mpos, int bytes) {
			int i, want;

			if (this.leftover != 0) {
				want = (16 - this.leftover);
				if (want > bytes)
					want = bytes;
				for (i = 0; i < want; i++)
					this.buffer[this.leftover + i] = m[mpos + i];
				bytes -= want;
				mpos += want;
				this.leftover += want;
				if (this.leftover < 16)
					return this;
				this.blocks(buffer, 0, 16);
				this.leftover = 0;
			}

			if (bytes >= 16) {
				want = bytes - (bytes % 16);
				this.blocks(m, mpos, want);
				mpos += want;
				bytes -= want;
			}

			if (bytes != 0) {
				for (i = 0; i < bytes; i++)
					this.buffer[this.leftover + i] = m[mpos + i];
				this.leftover += bytes;
			}

			return this;
		}

	}

	private static int crypto_onetimeauth(byte[] out, final int outpos, byte[] m, final int mpos, int n, byte[] k) {
		poly1305 s = new poly1305(k);
		s.update(m, mpos, n);
		s.finish(out, outpos);

		/*
		 * String dbgt = ""; for (int dbg = 0; dbg < out.length-outpos; dbg ++) dbgt +=
		 * " "+out[dbg+outpos]; Log.d(TAG, "crypto_onetimeauth -> "+dbgt);
		 */

		return 0;
	}

	public static int crypto_onetimeauth(byte[] out, byte[] m, int /* long */ n, byte[] k) {
		return crypto_onetimeauth(out, 0, m, 0, n, k);
	}

	private static int crypto_onetimeauth_verify(byte[] h, final int hoff, byte[] m, final int moff, int /* long */ n, byte[] k) {
		byte[] x = new byte[16];
		crypto_onetimeauth(x, 0, m, moff, n, k);
		return crypto_verify_16(h, hoff, x, 0);
	}

	public static int crypto_onetimeauth_verify(byte[] h, byte[] m, int /* long */ n, byte[] k) {
		return crypto_onetimeauth_verify(h, 0, m, 0, n, k);
	}

	public static int crypto_onetimeauth_verify(byte[] h, byte[] m, byte[] k) {
		return crypto_onetimeauth_verify(h, m, m != null ? m.length : 0, k);
	}

	public static int crypto_secretbox(byte[] c, byte[] m, int /* long */ d, byte[] n, byte[] k) {
		int i;
		if (d < 32)
			return -1;
		crypto_stream_xor(c, 0, m, 0, d, n, k);
		crypto_onetimeauth(c, 16, c, 32, d - 32, c);
		/// for (i = 0; i < 16; i++) c[i] = 0;
		return 0;
	}

	public static int crypto_secretbox_open(byte[] m, byte[] c, int /* long */ d, byte[] n, byte[] k) {
		int i;
		byte[] x = new byte[32];
		if (d < 32)
			return -1;
		crypto_stream(x, 0, 32, n, k);
		if (crypto_onetimeauth_verify(c, 16, c, 32, d - 32, x) != 0)
			return -1;
		crypto_stream_xor(m, 0, c, 0, d, n, k);
		/// for (i = 0; i < 32; i++) m[i] = 0;
		return 0;
	}

	private static void set25519(long[] r, long[] a) {
		int i;
		for (i = 0; i < 16; i++)
			r[i] = a[i];
	}

	private static void car25519(long[] o) {
		int i;
		long v, c = 1;
		for (i = 0; i < 16; i++) {
			v = o[i] + c + 65535;
			c = v >> 16;
			o[i] = v - c * 65536;
		}
		o[0] += c - 1 + 37 * (c - 1);
	}

	private static void sel25519(long[] p, long[] q, int b) {
		sel25519(p, 0, q, 0, b);
	}

	private static void sel25519(long[] p, final int poff, long[] q, final int qoff, int b) {
		long t, c = ~(b - 1);
		for (int i = 0; i < 16; i++) {
			t = c & (p[i + poff] ^ q[i + qoff]);
			p[i + poff] ^= t;
			q[i + qoff] ^= t;
		}
	}

	private static void pack25519(byte[] o, long[] n, final int noff) {
		int i, j, b;
		long[] m = new long[16], t = new long[16];
		for (i = 0; i < 16; i++)
			t[i] = n[i + noff];
		car25519(t);
		car25519(t);
		car25519(t);
		for (j = 0; j < 2; j++) {
			m[0] = t[0] - 0xffed;
			for (i = 1; i < 15; i++) {
				m[i] = t[i] - 0xffff - ((m[i - 1] >> 16) & 1);
				m[i - 1] &= 0xffff;
			}
			m[15] = t[15] - 0x7fff - ((m[14] >> 16) & 1);
			b = (int) ((m[15] >> 16) & 1);
			m[14] &= 0xffff;
			sel25519(t, 0, m, 0, 1 - b);
		}
		for (i = 0; i < 16; i++) {
			o[2 * i] = (byte) (t[i] & 0xff);
			o[2 * i + 1] = (byte) (t[i] >> 8);
		}
	}

	private static int neq25519(long[] a, long[] b) {
		return neq25519(a, 0, b, 0);
	}

	private static int neq25519(long[] a, final int aoff, long[] b, final int boff) {
		byte[] c = new byte[32], d = new byte[32];
		pack25519(c, a, aoff);
		pack25519(d, b, boff);
		return crypto_verify_32(c, 0, d, 0);
	}

	private static byte par25519(long[] a) {
		return par25519(a, 0);
	}

	private static byte par25519(long[] a, final int aoff) {
		byte[] d = new byte[32];
		pack25519(d, a, aoff);
		return (byte) (d[0] & 1);
	}

	private static void unpack25519(long[] o, byte[] n) {
		int i;
		for (i = 0; i < 16; i++)
			o[i] = (n[2 * i] & 0xff) + ((long) ((n[2 * i + 1] << 8) & 0xffff));
		o[15] &= 0x7fff;
	}

	private static void A(long[] o, long[] a, long[] b) {
		A(o, 0, a, 0, b, 0);
	}

	private static void A(long[] o, final int ooff, long[] a, final int aoff, long[] b, final int boff) {
		int i;
		for (i = 0; i < 16; i++)
			o[i + ooff] = a[i + aoff] + b[i + boff];
	}

	private static void Z(long[] o, long[] a, long[] b) {
		Z(o, 0, a, 0, b, 0);
	}

	private static void Z(long[] o, final int ooff, long[] a, final int aoff, long[] b, final int boff) {
		int i;
		for (i = 0; i < 16; i++)
			o[i + ooff] = a[i + aoff] - b[i + boff];
	}

	private static void M(long[] o, long[] a, long[] b) {
		M(o, 0, a, 0, b, 0);
	}

	private static void M(long[] o, final int ooff, long[] a, final int aoff, long[] b, final int boff) {
		long v, c, t0 = 0, t1 = 0, t2 = 0, t3 = 0, t4 = 0, t5 = 0, t6 = 0, t7 = 0, t8 = 0, t9 = 0, t10 = 0, t11 = 0, t12 = 0, t13 = 0, t14 = 0, t15 = 0,
				t16 = 0, t17 = 0, t18 = 0, t19 = 0, t20 = 0, t21 = 0, t22 = 0, t23 = 0, t24 = 0, t25 = 0, t26 = 0, t27 = 0, t28 = 0, t29 = 0, t30 = 0,
				b0 = b[0 + boff], b1 = b[1 + boff], b2 = b[2 + boff], b3 = b[3 + boff], b4 = b[4 + boff], b5 = b[5 + boff], b6 = b[6 + boff], b7 = b[7 + boff],
				b8 = b[8 + boff], b9 = b[9 + boff], b10 = b[10 + boff], b11 = b[11 + boff], b12 = b[12 + boff], b13 = b[13 + boff], b14 = b[14 + boff],
				b15 = b[15 + boff];

		v = a[0 + aoff];
		t0 += v * b0;
		t1 += v * b1;
		t2 += v * b2;
		t3 += v * b3;
		t4 += v * b4;
		t5 += v * b5;
		t6 += v * b6;
		t7 += v * b7;
		t8 += v * b8;
		t9 += v * b9;
		t10 += v * b10;
		t11 += v * b11;
		t12 += v * b12;
		t13 += v * b13;
		t14 += v * b14;
		t15 += v * b15;
		v = a[1 + aoff];
		t1 += v * b0;
		t2 += v * b1;
		t3 += v * b2;
		t4 += v * b3;
		t5 += v * b4;
		t6 += v * b5;
		t7 += v * b6;
		t8 += v * b7;
		t9 += v * b8;
		t10 += v * b9;
		t11 += v * b10;
		t12 += v * b11;
		t13 += v * b12;
		t14 += v * b13;
		t15 += v * b14;
		t16 += v * b15;
		v = a[2 + aoff];
		t2 += v * b0;
		t3 += v * b1;
		t4 += v * b2;
		t5 += v * b3;
		t6 += v * b4;
		t7 += v * b5;
		t8 += v * b6;
		t9 += v * b7;
		t10 += v * b8;
		t11 += v * b9;
		t12 += v * b10;
		t13 += v * b11;
		t14 += v * b12;
		t15 += v * b13;
		t16 += v * b14;
		t17 += v * b15;
		v = a[3 + aoff];
		t3 += v * b0;
		t4 += v * b1;
		t5 += v * b2;
		t6 += v * b3;
		t7 += v * b4;
		t8 += v * b5;
		t9 += v * b6;
		t10 += v * b7;
		t11 += v * b8;
		t12 += v * b9;
		t13 += v * b10;
		t14 += v * b11;
		t15 += v * b12;
		t16 += v * b13;
		t17 += v * b14;
		t18 += v * b15;
		v = a[4 + aoff];
		t4 += v * b0;
		t5 += v * b1;
		t6 += v * b2;
		t7 += v * b3;
		t8 += v * b4;
		t9 += v * b5;
		t10 += v * b6;
		t11 += v * b7;
		t12 += v * b8;
		t13 += v * b9;
		t14 += v * b10;
		t15 += v * b11;
		t16 += v * b12;
		t17 += v * b13;
		t18 += v * b14;
		t19 += v * b15;
		v = a[5 + aoff];
		t5 += v * b0;
		t6 += v * b1;
		t7 += v * b2;
		t8 += v * b3;
		t9 += v * b4;
		t10 += v * b5;
		t11 += v * b6;
		t12 += v * b7;
		t13 += v * b8;
		t14 += v * b9;
		t15 += v * b10;
		t16 += v * b11;
		t17 += v * b12;
		t18 += v * b13;
		t19 += v * b14;
		t20 += v * b15;
		v = a[6 + aoff];
		t6 += v * b0;
		t7 += v * b1;
		t8 += v * b2;
		t9 += v * b3;
		t10 += v * b4;
		t11 += v * b5;
		t12 += v * b6;
		t13 += v * b7;
		t14 += v * b8;
		t15 += v * b9;
		t16 += v * b10;
		t17 += v * b11;
		t18 += v * b12;
		t19 += v * b13;
		t20 += v * b14;
		t21 += v * b15;
		v = a[7 + aoff];
		t7 += v * b0;
		t8 += v * b1;
		t9 += v * b2;
		t10 += v * b3;
		t11 += v * b4;
		t12 += v * b5;
		t13 += v * b6;
		t14 += v * b7;
		t15 += v * b8;
		t16 += v * b9;
		t17 += v * b10;
		t18 += v * b11;
		t19 += v * b12;
		t20 += v * b13;
		t21 += v * b14;
		t22 += v * b15;
		v = a[8 + aoff];
		t8 += v * b0;
		t9 += v * b1;
		t10 += v * b2;
		t11 += v * b3;
		t12 += v * b4;
		t13 += v * b5;
		t14 += v * b6;
		t15 += v * b7;
		t16 += v * b8;
		t17 += v * b9;
		t18 += v * b10;
		t19 += v * b11;
		t20 += v * b12;
		t21 += v * b13;
		t22 += v * b14;
		t23 += v * b15;
		v = a[9 + aoff];
		t9 += v * b0;
		t10 += v * b1;
		t11 += v * b2;
		t12 += v * b3;
		t13 += v * b4;
		t14 += v * b5;
		t15 += v * b6;
		t16 += v * b7;
		t17 += v * b8;
		t18 += v * b9;
		t19 += v * b10;
		t20 += v * b11;
		t21 += v * b12;
		t22 += v * b13;
		t23 += v * b14;
		t24 += v * b15;
		v = a[10 + aoff];
		t10 += v * b0;
		t11 += v * b1;
		t12 += v * b2;
		t13 += v * b3;
		t14 += v * b4;
		t15 += v * b5;
		t16 += v * b6;
		t17 += v * b7;
		t18 += v * b8;
		t19 += v * b9;
		t20 += v * b10;
		t21 += v * b11;
		t22 += v * b12;
		t23 += v * b13;
		t24 += v * b14;
		t25 += v * b15;
		v = a[11 + aoff];
		t11 += v * b0;
		t12 += v * b1;
		t13 += v * b2;
		t14 += v * b3;
		t15 += v * b4;
		t16 += v * b5;
		t17 += v * b6;
		t18 += v * b7;
		t19 += v * b8;
		t20 += v * b9;
		t21 += v * b10;
		t22 += v * b11;
		t23 += v * b12;
		t24 += v * b13;
		t25 += v * b14;
		t26 += v * b15;
		v = a[12 + aoff];
		t12 += v * b0;
		t13 += v * b1;
		t14 += v * b2;
		t15 += v * b3;
		t16 += v * b4;
		t17 += v * b5;
		t18 += v * b6;
		t19 += v * b7;
		t20 += v * b8;
		t21 += v * b9;
		t22 += v * b10;
		t23 += v * b11;
		t24 += v * b12;
		t25 += v * b13;
		t26 += v * b14;
		t27 += v * b15;
		v = a[13 + aoff];
		t13 += v * b0;
		t14 += v * b1;
		t15 += v * b2;
		t16 += v * b3;
		t17 += v * b4;
		t18 += v * b5;
		t19 += v * b6;
		t20 += v * b7;
		t21 += v * b8;
		t22 += v * b9;
		t23 += v * b10;
		t24 += v * b11;
		t25 += v * b12;
		t26 += v * b13;
		t27 += v * b14;
		t28 += v * b15;
		v = a[14 + aoff];
		t14 += v * b0;
		t15 += v * b1;
		t16 += v * b2;
		t17 += v * b3;
		t18 += v * b4;
		t19 += v * b5;
		t20 += v * b6;
		t21 += v * b7;
		t22 += v * b8;
		t23 += v * b9;
		t24 += v * b10;
		t25 += v * b11;
		t26 += v * b12;
		t27 += v * b13;
		t28 += v * b14;
		t29 += v * b15;
		v = a[15 + aoff];
		t15 += v * b0;
		t16 += v * b1;
		t17 += v * b2;
		t18 += v * b3;
		t19 += v * b4;
		t20 += v * b5;
		t21 += v * b6;
		t22 += v * b7;
		t23 += v * b8;
		t24 += v * b9;
		t25 += v * b10;
		t26 += v * b11;
		t27 += v * b12;
		t28 += v * b13;
		t29 += v * b14;
		t30 += v * b15;

		t0 += 38 * t16;
		t1 += 38 * t17;
		t2 += 38 * t18;
		t3 += 38 * t19;
		t4 += 38 * t20;
		t5 += 38 * t21;
		t6 += 38 * t22;
		t7 += 38 * t23;
		t8 += 38 * t24;
		t9 += 38 * t25;
		t10 += 38 * t26;
		t11 += 38 * t27;
		t12 += 38 * t28;
		t13 += 38 * t29;
		t14 += 38 * t30;
		// t15 left as is

		// first car
		c = 1;
		v = t0 + c + 65535;
		c = v >> 16;
		t0 = v - c * 65536;
		v = t1 + c + 65535;
		c = v >> 16;
		t1 = v - c * 65536;
		v = t2 + c + 65535;
		c = v >> 16;
		t2 = v - c * 65536;
		v = t3 + c + 65535;
		c = v >> 16;
		t3 = v - c * 65536;
		v = t4 + c + 65535;
		c = v >> 16;
		t4 = v - c * 65536;
		v = t5 + c + 65535;
		c = v >> 16;
		t5 = v - c * 65536;
		v = t6 + c + 65535;
		c = v >> 16;
		t6 = v - c * 65536;
		v = t7 + c + 65535;
		c = v >> 16;
		t7 = v - c * 65536;
		v = t8 + c + 65535;
		c = v >> 16;
		t8 = v - c * 65536;
		v = t9 + c + 65535;
		c = v >> 16;
		t9 = v - c * 65536;
		v = t10 + c + 65535;
		c = v >> 16;
		t10 = v - c * 65536;
		v = t11 + c + 65535;
		c = v >> 16;
		t11 = v - c * 65536;
		v = t12 + c + 65535;
		c = v >> 16;
		t12 = v - c * 65536;
		v = t13 + c + 65535;
		c = v >> 16;
		t13 = v - c * 65536;
		v = t14 + c + 65535;
		c = v >> 16;
		t14 = v - c * 65536;
		v = t15 + c + 65535;
		c = v >> 16;
		t15 = v - c * 65536;
		t0 += c - 1 + 37 * (c - 1);

		// second car
		c = 1;
		v = t0 + c + 65535;
		c = v >> 16;
		t0 = v - c * 65536;
		v = t1 + c + 65535;
		c = v >> 16;
		t1 = v - c * 65536;
		v = t2 + c + 65535;
		c = v >> 16;
		t2 = v - c * 65536;
		v = t3 + c + 65535;
		c = v >> 16;
		t3 = v - c * 65536;
		v = t4 + c + 65535;
		c = v >> 16;
		t4 = v - c * 65536;
		v = t5 + c + 65535;
		c = v >> 16;
		t5 = v - c * 65536;
		v = t6 + c + 65535;
		c = v >> 16;
		t6 = v - c * 65536;
		v = t7 + c + 65535;
		c = v >> 16;
		t7 = v - c * 65536;
		v = t8 + c + 65535;
		c = v >> 16;
		t8 = v - c * 65536;
		v = t9 + c + 65535;
		c = v >> 16;
		t9 = v - c * 65536;
		v = t10 + c + 65535;
		c = v >> 16;
		t10 = v - c * 65536;
		v = t11 + c + 65535;
		c = v >> 16;
		t11 = v - c * 65536;
		v = t12 + c + 65535;
		c = v >> 16;
		t12 = v - c * 65536;
		v = t13 + c + 65535;
		c = v >> 16;
		t13 = v - c * 65536;
		v = t14 + c + 65535;
		c = v >> 16;
		t14 = v - c * 65536;
		v = t15 + c + 65535;
		c = v >> 16;
		t15 = v - c * 65536;
		t0 += c - 1 + 37 * (c - 1);

		o[0 + ooff] = t0;
		o[1 + ooff] = t1;
		o[2 + ooff] = t2;
		o[3 + ooff] = t3;
		o[4 + ooff] = t4;
		o[5 + ooff] = t5;
		o[6 + ooff] = t6;
		o[7 + ooff] = t7;
		o[8 + ooff] = t8;
		o[9 + ooff] = t9;
		o[10 + ooff] = t10;
		o[11 + ooff] = t11;
		o[12 + ooff] = t12;
		o[13 + ooff] = t13;
		o[14 + ooff] = t14;
		o[15 + ooff] = t15;
	}

	private static void S(long[] o, long[] a) {
		S(o, 0, a, 0);
	}

	private static void S(long[] o, final int ooff, long[] a, final int aoff) {
		M(o, ooff, a, aoff, a, aoff);
	}

	private static void inv25519(long[] o, final int ooff, long[] i, final int ioff) {
		long[] c = new long[16];
		int a;
		for (a = 0; a < 16; a++)
			c[a] = i[a + ioff];
		for (a = 253; a >= 0; a--) {
			S(c, 0, c, 0);
			if (a != 2 && a != 4)
				M(c, 0, c, 0, i, ioff);
		}
		for (a = 0; a < 16; a++)
			o[a + ooff] = c[a];
	}

	private static void pow2523(long[] o, long[] i) {
		long[] c = new long[16];
		int a;

		for (a = 0; a < 16; a++)
			c[a] = i[a];

		for (a = 250; a >= 0; a--) {
			S(c, 0, c, 0);
			if (a != 1)
				M(c, 0, c, 0, i, 0);
		}

		for (a = 0; a < 16; a++)
			o[a] = c[a];
	}

	public static int crypto_scalarmult(byte[] q, byte[] n, byte[] p) {
		byte[] z = new byte[32];
		long[] x = new long[80];
		int r, i;
		long[] a = new long[16], b = new long[16], c = new long[16], d = new long[16], e = new long[16], f = new long[16];
		for (i = 0; i < 31; i++)
			z[i] = n[i];
		z[31] = (byte) (((n[31] & 127) | 64) & 0xff);
		z[0] &= 248;
		unpack25519(x, p);
		for (i = 0; i < 16; i++) {
			b[i] = x[i];
			d[i] = a[i] = c[i] = 0;
		}
		a[0] = d[0] = 1;
		for (i = 254; i >= 0; --i) {
			r = (z[i >>> 3] >>> (i & 7)) & 1;
			sel25519(a, b, r);
			sel25519(c, d, r);
			A(e, a, c);
			Z(a, a, c);
			A(c, b, d);
			Z(b, b, d);
			S(d, e);
			S(f, a);
			M(a, c, a);
			M(c, b, e);
			A(e, a, c);
			Z(a, a, c);
			S(b, a);
			Z(c, d, f);
			M(a, c, _121665);
			A(a, a, d);
			M(c, c, a);
			M(a, d, f);
			M(d, b, x);
			S(b, e);
			sel25519(a, b, r);
			sel25519(c, d, r);
		}
		for (i = 0; i < 16; i++) {
			x[i + 16] = a[i];
			x[i + 32] = c[i];
			x[i + 48] = b[i];
			x[i + 64] = d[i];
		}
		inv25519(x, 32, x, 32);
		M(x, 16, x, 16, x, 32);
		pack25519(q, x, 16);

		return 0;
	}

	public static int crypto_scalarmult_base(byte[] q, byte[] n) {
		return crypto_scalarmult(q, n, _9);
	}

	public static int crypto_box_keypair(byte[] y, byte[] x) {
		randombytes(x, 32);
		return crypto_scalarmult_base(y, x);
	}

	public static int crypto_box_beforenm(byte[] k, byte[] y, byte[] x) {
		byte[] s = new byte[32];
		crypto_scalarmult(s, x, y);

		/*
		 * String dbgt = ""; for (int dbg = 0; dbg < s.length; dbg ++) dbgt +=
		 * " "+s[dbg]; Log.d(TAG, "crypto_box_beforenm -> "+dbgt);
		 * 
		 * dbgt = ""; for (int dbg = 0; dbg < x.length; dbg ++) dbgt += " "+x[dbg];
		 * Log.d(TAG, "crypto_box_beforenm, x -> "+dbgt);
		 * 
		 * dbgt = ""; for (int dbg = 0; dbg < y.length; dbg ++) dbgt += " "+y[dbg];
		 * Log.d(TAG, "crypto_box_beforenm, y -> "+dbgt);
		 */

		return crypto_core_hsalsa20(k, _0, s, sigma);
	}

	public static int crypto_box_afternm(byte[] c, byte[] m, int /* long */ d, byte[] n, byte[] k) {
		return crypto_secretbox(c, m, d, n, k);
	}

	public static int crypto_box_open_afternm(byte[] m, byte[] c, int /* long */ d, byte[] n, byte[] k) {
		return crypto_secretbox_open(m, c, d, n, k);
	}

	public static int crypto_box(byte[] c, byte[] m, int /* long */ d, byte[] n, byte[] y, byte[] x) {
		byte[] k = new byte[32];

		/// L/og.d(TAG, "crypto_box start ...");

		crypto_box_beforenm(k, y, x);
		return crypto_box_afternm(c, m, d, n, k);
	}

	public static int crypto_box_open(byte[] m, byte[] c, int /* long */ d, byte[] n, byte[] y, byte[] x) {
		byte[] k = new byte[32];
		crypto_box_beforenm(k, y, x);
		return crypto_box_open_afternm(m, c, d, n, k);
	}

	private static final long K[] =
		{ 0x428a2f98d728ae22L, 0x7137449123ef65cdL, 0xb5c0fbcfec4d3b2fL, 0xe9b5dba58189dbbcL, 0x3956c25bf348b538L, 0x59f111f1b605d019L, 0x923f82a4af194f9bL,
				0xab1c5ed5da6d8118L, 0xd807aa98a3030242L, 0x12835b0145706fbeL, 0x243185be4ee4b28cL, 0x550c7dc3d5ffb4e2L, 0x72be5d74f27b896fL,
				0x80deb1fe3b1696b1L, 0x9bdc06a725c71235L, 0xc19bf174cf692694L, 0xe49b69c19ef14ad2L, 0xefbe4786384f25e3L, 0x0fc19dc68b8cd5b5L,
				0x240ca1cc77ac9c65L, 0x2de92c6f592b0275L, 0x4a7484aa6ea6e483L, 0x5cb0a9dcbd41fbd4L, 0x76f988da831153b5L, 0x983e5152ee66dfabL,
				0xa831c66d2db43210L, 0xb00327c898fb213fL, 0xbf597fc7beef0ee4L, 0xc6e00bf33da88fc2L, 0xd5a79147930aa725L, 0x06ca6351e003826fL,
				0x142929670a0e6e70L, 0x27b70a8546d22ffcL, 0x2e1b21385c26c926L, 0x4d2c6dfc5ac42aedL, 0x53380d139d95b3dfL, 0x650a73548baf63deL,
				0x766a0abb3c77b2a8L, 0x81c2c92e47edaee6L, 0x92722c851482353bL, 0xa2bfe8a14cf10364L, 0xa81a664bbc423001L, 0xc24b8b70d0f89791L,
				0xc76c51a30654be30L, 0xd192e819d6ef5218L, 0xd69906245565a910L, 0xf40e35855771202aL, 0x106aa07032bbd1b8L, 0x19a4c116b8d2d0c8L,
				0x1e376c085141ab53L, 0x2748774cdf8eeb99L, 0x34b0bcb5e19b48a8L, 0x391c0cb3c5c95a63L, 0x4ed8aa4ae3418acbL, 0x5b9cca4f7763e373L,
				0x682e6ff3d6b2b8a3L, 0x748f82ee5defb2fcL, 0x78a5636f43172f60L, 0x84c87814a1f0ab72L, 0x8cc702081a6439ecL, 0x90befffa23631e28L,
				0xa4506cebde82bde9L, 0xbef9a3f7b2c67915L, 0xc67178f2e372532bL, 0xca273eceea26619cL, 0xd186b8c721c0c207L, 0xeada7dd6cde0eb1eL,
				0xf57d4f7fee6ed178L, 0x06f067aa72176fbaL, 0x0a637dc5a2c898a6L, 0x113f9804bef90daeL, 0x1b710b35131c471bL, 0x28db77f523047d84L,
				0x32caab7b40c72493L, 0x3c9ebe0a15c9bebcL, 0x431d67c49c100d4cL, 0x4cc5d4becb3e42b6L, 0x597f299cfc657e2aL, 0x5fcb6fab3ad6faecL,
				0x6c44198c4a475817L };

	private static int crypto_hashblocks_hl(int[] hh, int[] hl, byte[] m, final int moff, int n) {

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < n; dbg ++) dbgt += " "+m[dbg+moff];
		/// Log.d(TAG, "crypto_hashblocks_hl m/"+n + "-> "+dbgt);

		int[] wh = new int[16], wl = new int[16];
		int bh0, bh1, bh2, bh3, bh4, bh5, bh6, bh7, bl0, bl1, bl2, bl3, bl4, bl5, bl6, bl7, th, tl, h, l, i, j, a, b, c, d;

		int ah0 = hh[0], ah1 = hh[1], ah2 = hh[2], ah3 = hh[3], ah4 = hh[4], ah5 = hh[5], ah6 = hh[6], ah7 = hh[7],

				al0 = hl[0], al1 = hl[1], al2 = hl[2], al3 = hl[3], al4 = hl[4], al5 = hl[5], al6 = hl[6], al7 = hl[7];

		int pos = 0;
		while (n >= 128) {
			for (i = 0; i < 16; i++) {
				j = 8 * i + pos;
				wh[i] = ((m[j + 0 + moff] & 0xff) << 24) | ((m[j + 1 + moff] & 0xff) << 16) | ((m[j + 2 + moff] & 0xff) << 8) | ((m[j + 3 + moff] & 0xff) << 0);
				wl[i] = ((m[j + 4 + moff] & 0xff) << 24) | ((m[j + 5 + moff] & 0xff) << 16) | ((m[j + 6 + moff] & 0xff) << 8) | ((m[j + 7 + moff] & 0xff) << 0);
			}
			for (i = 0; i < 80; i++) {
				bh0 = ah0;
				bh1 = ah1;
				bh2 = ah2;
				bh3 = ah3;
				bh4 = ah4;
				bh5 = ah5;
				bh6 = ah6;
				bh7 = ah7;

				bl0 = al0;
				bl1 = al1;
				bl2 = al2;
				bl3 = al3;
				bl4 = al4;
				bl5 = al5;
				bl6 = al6;
				bl7 = al7;

				// add
				h = ah7;
				l = al7;

				a = l & 0xffff;
				b = l >>> 16;
				c = h & 0xffff;
				d = h >>> 16;

				// Sigma1
				h = ((ah4 >>> 14) | (al4 << (32 - 14))) ^ ((ah4 >>> 18) | (al4 << (32 - 18))) ^ ((al4 >>> (41 - 32)) | (ah4 << (32 - (41 - 32))));
				l = ((al4 >>> 14) | (ah4 << (32 - 14))) ^ ((al4 >>> 18) | (ah4 << (32 - 18))) ^ ((ah4 >>> (41 - 32)) | (al4 << (32 - (41 - 32))));

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				// Ch
				h = (ah4 & ah5) ^ (~ah4 & ah6);
				l = (al4 & al5) ^ (~al4 & al6);

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				// K
				/// h = K[i*2];
				/// l = K[i*2+1];
				h = (int) ((K[i] >>> 32) & 0xffffffff);
				l = (int) ((K[i] >>> 0) & 0xffffffff);

				/// Log.d(TAG, "i"+i + ",h:0x"+Integer.toHexString(h) +
				/// ",l:0x"+Integer.toHexString(l));

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				// w
				h = wh[i % 16];
				l = wl[i % 16];

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				b += a >>> 16;
				c += b >>> 16;
				d += c >>> 16;

				th = c & 0xffff | d << 16;
				tl = a & 0xffff | b << 16;

				// add
				h = th;
				l = tl;

				a = l & 0xffff;
				b = l >>> 16;
				c = h & 0xffff;
				d = h >>> 16;

				// Sigma0
				h = ((ah0 >>> 28) | (al0 << (32 - 28))) ^ ((al0 >>> (34 - 32)) | (ah0 << (32 - (34 - 32)))) ^ ((al0 >>> (39 - 32)) | (ah0 << (32 - (39 - 32))));
				l = ((al0 >>> 28) | (ah0 << (32 - 28))) ^ ((ah0 >>> (34 - 32)) | (al0 << (32 - (34 - 32)))) ^ ((ah0 >>> (39 - 32)) | (al0 << (32 - (39 - 32))));

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				// Maj
				h = (ah0 & ah1) ^ (ah0 & ah2) ^ (ah1 & ah2);
				l = (al0 & al1) ^ (al0 & al2) ^ (al1 & al2);

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				b += a >>> 16;
				c += b >>> 16;
				d += c >>> 16;

				bh7 = (c & 0xffff) | (d << 16);
				bl7 = (a & 0xffff) | (b << 16);

				// add
				h = bh3;
				l = bl3;

				a = l & 0xffff;
				b = l >>> 16;
				c = h & 0xffff;
				d = h >>> 16;

				h = th;
				l = tl;

				a += l & 0xffff;
				b += l >>> 16;
				c += h & 0xffff;
				d += h >>> 16;

				b += a >>> 16;
				c += b >>> 16;
				d += c >>> 16;

				bh3 = (c & 0xffff) | (d << 16);
				bl3 = (a & 0xffff) | (b << 16);

				ah1 = bh0;
				ah2 = bh1;
				ah3 = bh2;
				ah4 = bh3;
				ah5 = bh4;
				ah6 = bh5;
				ah7 = bh6;
				ah0 = bh7;

				al1 = bl0;
				al2 = bl1;
				al3 = bl2;
				al4 = bl3;
				al5 = bl4;
				al6 = bl5;
				al7 = bl6;
				al0 = bl7;

				if (i % 16 == 15) {
					for (j = 0; j < 16; j++) {
						// add
						h = wh[j];
						l = wl[j];

						a = l & 0xffff;
						b = l >>> 16;
						c = h & 0xffff;
						d = h >>> 16;

						h = wh[(j + 9) % 16];
						l = wl[(j + 9) % 16];

						a += l & 0xffff;
						b += l >>> 16;
						c += h & 0xffff;
						d += h >>> 16;

						// sigma0
						th = wh[(j + 1) % 16];
						tl = wl[(j + 1) % 16];
						h = ((th >>> 1) | (tl << (32 - 1))) ^ ((th >>> 8) | (tl << (32 - 8))) ^ (th >>> 7);
						l = ((tl >>> 1) | (th << (32 - 1))) ^ ((tl >>> 8) | (th << (32 - 8))) ^ ((tl >>> 7) | (th << (32 - 7)));

						a += l & 0xffff;
						b += l >>> 16;
						c += h & 0xffff;
						d += h >>> 16;

						// sigma1
						th = wh[(j + 14) % 16];
						tl = wl[(j + 14) % 16];
						h = ((th >>> 19) | (tl << (32 - 19))) ^ ((tl >>> (61 - 32)) | (th << (32 - (61 - 32)))) ^ (th >>> 6);
						l = ((tl >>> 19) | (th << (32 - 19))) ^ ((th >>> (61 - 32)) | (tl << (32 - (61 - 32)))) ^ ((tl >>> 6) | (th << (32 - 6)));

						a += l & 0xffff;
						b += l >>> 16;
						c += h & 0xffff;
						d += h >>> 16;

						b += a >>> 16;
						c += b >>> 16;
						d += c >>> 16;

						wh[j] = (c & 0xffff) | (d << 16);
						wl[j] = (a & 0xffff) | (b << 16);
					}
				}
			}

			// add
			h = ah0;
			l = al0;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[0];
			l = hl[0];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[0] = ah0 = (c & 0xffff) | (d << 16);
			hl[0] = al0 = (a & 0xffff) | (b << 16);

			h = ah1;
			l = al1;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[1];
			l = hl[1];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[1] = ah1 = (c & 0xffff) | (d << 16);
			hl[1] = al1 = (a & 0xffff) | (b << 16);

			h = ah2;
			l = al2;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[2];
			l = hl[2];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[2] = ah2 = (c & 0xffff) | (d << 16);
			hl[2] = al2 = (a & 0xffff) | (b << 16);

			h = ah3;
			l = al3;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[3];
			l = hl[3];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[3] = ah3 = (c & 0xffff) | (d << 16);
			hl[3] = al3 = (a & 0xffff) | (b << 16);

			h = ah4;
			l = al4;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[4];
			l = hl[4];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[4] = ah4 = (c & 0xffff) | (d << 16);
			hl[4] = al4 = (a & 0xffff) | (b << 16);

			h = ah5;
			l = al5;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[5];
			l = hl[5];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[5] = ah5 = (c & 0xffff) | (d << 16);
			hl[5] = al5 = (a & 0xffff) | (b << 16);

			h = ah6;
			l = al6;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[6];
			l = hl[6];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[6] = ah6 = (c & 0xffff) | (d << 16);
			hl[6] = al6 = (a & 0xffff) | (b << 16);

			h = ah7;
			l = al7;

			a = l & 0xffff;
			b = l >>> 16;
			c = h & 0xffff;
			d = h >>> 16;

			h = hh[7];
			l = hl[7];

			a += l & 0xffff;
			b += l >>> 16;
			c += h & 0xffff;
			d += h >>> 16;

			b += a >>> 16;
			c += b >>> 16;
			d += c >>> 16;

			hh[7] = ah7 = (c & 0xffff) | (d << 16);
			hl[7] = al7 = (a & 0xffff) | (b << 16);

			pos += 128;
			n -= 128;

			/*
			 * dbgt = ""; for (int dbg = 0; dbg < hh.length; dbg ++) dbgt += " "+hh[dbg];
			 * Log.d(TAG, "\ncrypto_hashblocks_hl hh -> "+dbgt);
			 * 
			 * dbgt = ""; for (int dbg = 0; dbg < hl.length; dbg ++) dbgt += " "+hl[dbg];
			 * Log.d(TAG, "\ncrypto_hashblocks_hl hl -> "+dbgt);
			 */
		}

		return n;
	}

	// TBD 64bits of n
	/// int crypto_hash(byte [] out, byte [] m, long n)
	public static int crypto_hash(byte[] out, byte[] m, final int moff, int n) {
		int[] hh = new int[8], hl = new int[8];
		byte[] x = new byte[256];
		int i, b = n;
		long u;

		hh[0] = 0x6a09e667;
		hh[1] = 0xbb67ae85;
		hh[2] = 0x3c6ef372;
		hh[3] = 0xa54ff53a;
		hh[4] = 0x510e527f;
		hh[5] = 0x9b05688c;
		hh[6] = 0x1f83d9ab;
		hh[7] = 0x5be0cd19;

		hl[0] = 0xf3bcc908;
		hl[1] = 0x84caa73b;
		hl[2] = 0xfe94f82b;
		hl[3] = 0x5f1d36f1;
		hl[4] = 0xade682d1;
		hl[5] = 0x2b3e6c1f;
		hl[6] = 0xfb41bd6b;
		hl[7] = 0x137e2179;

		if (n >= 128) {
			crypto_hashblocks_hl(hh, hl, m, moff, n);
			n %= 128;
		}

		for (i = 0; i < n; i++)
			x[i] = m[b - n + i + moff];
		x[n] = (byte) 128;

		n = 256 - 128 * (n < 112 ? 1 : 0);
		x[n - 9] = 0;

		ts64(x, n - 8, b << 3/* (b / 0x20000000) | 0, b << 3 */);

		crypto_hashblocks_hl(hh, hl, x, 0, n);

		for (i = 0; i < 8; i++) {
			u = hh[i];
			u <<= 32;
			u |= hl[i] & 0xffffffffL;
			ts64(out, 8 * i, u);
		}

		return 0;
	}

	public static int crypto_hash(byte[] out, byte[] m) {
		return crypto_hash(out, m, 0, m != null ? m.length : 0);
	}

	// gf: long[16]
	/// private static void add(gf p[4],gf q[4])
	private static void add(long[] p[], long[] q[]) {
		long[] a = new long[16];
		long[] b = new long[16];
		long[] c = new long[16];
		long[] d = new long[16];
		long[] t = new long[16];
		long[] e = new long[16];
		long[] f = new long[16];
		long[] g = new long[16];
		long[] h = new long[16];

		long[] p0 = p[0];
		long[] p1 = p[1];
		long[] p2 = p[2];
		long[] p3 = p[3];

		long[] q0 = q[0];
		long[] q1 = q[1];
		long[] q2 = q[2];
		long[] q3 = q[3];

		Z(a, 0, p1, 0, p0, 0);
		Z(t, 0, q1, 0, q0, 0);
		M(a, 0, a, 0, t, 0);
		A(b, 0, p0, 0, p1, 0);
		A(t, 0, q0, 0, q1, 0);
		M(b, 0, b, 0, t, 0);
		M(c, 0, p3, 0, q3, 0);
		M(c, 0, c, 0, D2, 0);
		M(d, 0, p2, 0, q2, 0);

		A(d, 0, d, 0, d, 0);
		Z(e, 0, b, 0, a, 0);
		Z(f, 0, d, 0, c, 0);
		A(g, 0, d, 0, c, 0);
		A(h, 0, b, 0, a, 0);

		M(p0, 0, e, 0, f, 0);
		M(p1, 0, h, 0, g, 0);
		M(p2, 0, g, 0, f, 0);
		M(p3, 0, e, 0, h, 0);
	}

	private static void cswap(long[] p[], long[] q[], byte b) {
		int i;

		for (i = 0; i < 4; i++)
			sel25519(p[i], 0, q[i], 0, b);
	}

	private static void pack(byte[] r, long[] p[]) {
		long[] tx = new long[16];
		long[] ty = new long[16];
		long[] zi = new long[16];

		inv25519(zi, 0, p[2], 0);

		M(tx, 0, p[0], 0, zi, 0);
		M(ty, 0, p[1], 0, zi, 0);

		pack25519(r, ty, 0);

		r[31] ^= par25519(tx, 0) << 7;
	}

	private static void scalarmult(long[] p[], long[] q[], byte[] s, final int soff) {
		int i;

		set25519(p[0], gf0);
		set25519(p[1], gf1);
		set25519(p[2], gf1);
		set25519(p[3], gf0);

		for (i = 255; i >= 0; --i) {
			byte b = (byte) ((s[i / 8 + soff] >>> (i & 7)) & 1);

			cswap(p, q, b);
			add(q, p);
			add(p, p);
			cswap(p, q, b);
		}

		/// String dbgt = "";
		/// for (int dbg = 0; dbg < p.length; dbg ++) for (int dd = 0; dd <
		/// p[dbg].length; dd ++) dbgt += " "+p[dbg][dd];
		/// L/og.d(TAG, "scalarmult -> "+dbgt);
	}

	private static void scalarbase(long[] p[], byte[] s, final int soff) {
		long[][] q = new long[4][];

		q[0] = new long[16];
		q[1] = new long[16];
		q[2] = new long[16];
		q[3] = new long[16];

		set25519(q[0], X);
		set25519(q[1], Y);
		set25519(q[2], gf1);
		M(q[3], 0, X, 0, Y, 0);
		scalarmult(p, q, s, soff);
	}

	public static int crypto_sign_keypair(byte[] pk, byte[] sk, boolean seeded) {
		byte[] d = new byte[64];
		long[][] p = new long[4][];

		p[0] = new long[16];
		p[1] = new long[16];
		p[2] = new long[16];
		p[3] = new long[16];

		int i;

		if (!seeded)
			randombytes(sk, 32);
		crypto_hash(d, sk, 0, 32);
		d[0] &= 248;
		d[31] &= 127;
		d[31] |= 64;

		scalarbase(p, d, 0);
		pack(pk, p);

		for (i = 0; i < 32; i++)
			sk[i + 32] = pk[i];
		return 0;
	}

	private static final long L[] =
		{ 0xed, 0xd3, 0xf5, 0x5c, 0x1a, 0x63, 0x12, 0x58, 0xd6, 0x9c, 0xf7, 0xa2, 0xde, 0xf9, 0xde, 0x14, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0x10 };

	private static void modL(byte[] r, final int roff, long x[]) {
		long carry;
		int i, j;

		for (i = 63; i >= 32; --i) {
			carry = 0;
			for (j = i - 32; j < i - 12; ++j) {
				x[j] += carry - 16 * x[i] * L[j - (i - 32)];
				carry = (x[j] + 128) >> 8;
				x[j] -= carry << 8;
			}
			x[j] += carry;
			x[i] = 0;
		}
		carry = 0;

		for (j = 0; j < 32; j++) {
			x[j] += carry - (x[31] >> 4) * L[j];
			carry = x[j] >> 8;
			x[j] &= 255;
		}

		for (j = 0; j < 32; j++)
			x[j] -= carry * L[j];

		for (i = 0; i < 32; i++) {
			x[i + 1] += x[i] >> 8;
			r[i + roff] = (byte) (x[i] & 255);
		}
	}

	private static void reduce(byte[] r) {
		long[] x = new long[64];
		int i;

		for (i = 0; i < 64; i++)
			x[i] = (long) (r[i] & 0xff);

		for (i = 0; i < 64; i++)
			r[i] = 0;

		modL(r, 0, x);
	}

	// TBD... 64bits of n
	/// int crypto_sign(byte [] sm, long * smlen, byte [] m, long n, byte [] sk)
	public static int crypto_sign(byte[] sm, long dummy /* *smlen not used */, byte[] m, final int moff, int/* long */ n, byte[] sk) {
		byte[] d = new byte[64], h = new byte[64], r = new byte[64];

		int i, j;
		long[] x = new long[64];

		long[][] p = new long[4][];
		p[0] = new long[16];
		p[1] = new long[16];
		p[2] = new long[16];
		p[3] = new long[16];

		crypto_hash(d, sk, 0, 32);
		d[0] &= 248;
		d[31] &= 127;
		d[31] |= 64;

		/// *smlen = n+64;

		for (i = 0; i < n; i++)
			sm[64 + i] = m[i + moff];

		for (i = 0; i < 32; i++)
			sm[32 + i] = d[32 + i];

		crypto_hash(r, sm, 32, n + 32);
		reduce(r);
		scalarbase(p, r, 0);
		pack(sm, p);

		for (i = 0; i < 32; i++)
			sm[i + 32] = sk[i + 32];
		crypto_hash(h, sm, 0, n + 64);
		reduce(h);

		for (i = 0; i < 64; i++)
			x[i] = 0;

		for (i = 0; i < 32; i++)
			x[i] = (long) (r[i] & 0xff);

		for (i = 0; i < 32; i++)
			for (j = 0; j < 32; j++)
				x[i + j] += (h[i] & 0xff) * (long) (d[j] & 0xff);

		modL(sm, 32, x);

		return 0;
	}

	private static int unpackneg(long[] r[], byte p[]) {
		long[] t = new long[16];
		long[] chk = new long[16];
		long[] num = new long[16];
		long[] den = new long[16];
		long[] den2 = new long[16];
		long[] den4 = new long[16];
		long[] den6 = new long[16];

		set25519(r[2], gf1);
		unpack25519(r[1], p);
		S(num, r[1]);
		M(den, num, D);
		Z(num, num, r[2]);
		A(den, r[2], den);

		S(den2, den);
		S(den4, den2);
		M(den6, den4, den2);
		M(t, den6, num);
		M(t, t, den);

		pow2523(t, t);
		M(t, t, num);
		M(t, t, den);
		M(t, t, den);
		M(r[0], t, den);

		S(chk, r[0]);
		M(chk, chk, den);
		if (neq25519(chk, num) != 0)
			M(r[0], r[0], I);

		S(chk, r[0]);
		M(chk, chk, den);
		if (neq25519(chk, num) != 0)
			return -1;

		if (par25519(r[0]) == ((p[31] & 0xFF) >>> 7))
			Z(r[0], gf0, r[0]);

		M(r[3], r[0], r[1]);

		return 0;
	}

	/// TBD 64bits of mlen
	/// int crypto_sign_open(byte []m,long *mlen,byte []sm,long n,byte []pk)
	public static int crypto_sign_open(byte[] m, long dummy /* *mlen not used */, byte[] sm, final int smoff, int/* long */ n, byte[] pk) {
		int i;
		byte[] t = new byte[32], h = new byte[64];

		long[][] p = new long[4][];
		p[0] = new long[16];
		p[1] = new long[16];
		p[2] = new long[16];
		p[3] = new long[16];

		long[][] q = new long[4][];
		q[0] = new long[16];
		q[1] = new long[16];
		q[2] = new long[16];
		q[3] = new long[16];

		/// *mlen = -1;

		if (n < 64)
			return -1;

		if (unpackneg(q, pk) != 0)
			return -1;

		for (i = 0; i < n; i++)
			m[i] = sm[i + smoff];

		for (i = 0; i < 32; i++)
			m[i + 32] = pk[i];

		crypto_hash(h, m, 0, n);

		reduce(h);
		scalarmult(p, q, h, 0);

		scalarbase(q, sm, 32 + smoff);
		add(p, q);
		pack(t, p);

		n -= 64;
		if (crypto_verify_32(sm, smoff, t, 0) != 0) {
			// optimizing it
			/// for (i = 0; i < n; i ++) m[i] = 0;
			return -1;
		}

		// TBD optimizing ...
		/// for (i = 0; i < n; i ++) m[i] = sm[i + 64 + smoff];
		/// *mlen = n;

		return 0;
	}

	static final SecureRandom gr = GlobalRandom.getGlobalInsecureRandom();

	public static byte[] randombytes(byte[] x) {
		gr.nextBytes(x);
		return x;
	}

	public static byte[] randombytes(int len) {
		return randombytes(new byte[len]);
	}

	public static byte[] randombytes(byte[] x, int len) {
		byte[] b = randombytes(len);
		System.arraycopy(b, 0, x, 0, len);
		return x;
	}

	/*
	 * public static byte[] randombytes(byte [] x, int len) { int ret = len % 8;
	 * long rnd;
	 * 
	 * for (int i = 0; i < len-ret; i += 8) { rnd = jrandom.nextLong();
	 * 
	 * x[i+0] = (byte) (rnd >>> 0); x[i+1] = (byte) (rnd >>> 8); x[i+2] = (byte)
	 * (rnd >>> 16); x[i+3] = (byte) (rnd >>> 24); x[i+4] = (byte) (rnd >>> 32);
	 * x[i+5] = (byte) (rnd >>> 40); x[i+6] = (byte) (rnd >>> 48); x[i+7] = (byte)
	 * (rnd >>> 56); }
	 * 
	 * if (ret > 0) { rnd = jrandom.nextLong(); for (int i = len-ret; i < len; i ++)
	 * x[i] = (byte) (rnd >>> 8*i); } return x; }
	 */

	public static byte[] makeBoxNonce() {
		return randombytes(Box.nonceLength);
	}

	public static byte[] makeSecretBoxNonce() {
		return randombytes(SecretBox.nonceLength);
	}

	public static String base64EncodeToString(byte[] b) {
		return Base64.encodeBase64String(b);
	}
	// byte[] Base64.getUrlEncoder().withoutPadding().encode(b);

	public static byte[] base64Decode(String s) {
		return Base64.decodeBase64(s);
	}
	// byte[] Base64.getUrlDecoder().decode(byte[] b)

	public static String hexEncodeToString(byte[] raw) {
		String HEXES = "0123456789ABCDEF";
		final StringBuilder hex = new StringBuilder(2 * raw.length);
		for (final byte b : raw) {
			hex.append(HEXES.charAt((b & 0xF0) >> 4)).append(HEXES.charAt((b & 0x0F)));
		}
		return hex.toString();
	}

	public static byte[] hexDecode(String s) {
		byte[] b = new byte[s.length() / 2];
		for (int i = 0; i < s.length(); i += 2) {
			b[i / 2] = (byte) ((Character.digit(s.charAt(i), 16) << 4) + Character.digit(s.charAt(i + 1), 16));
		}
		return b;
	}
}
